#!/usr/bin/env python3
"""
ThoughtSpot Deployment Module
A comprehensive tool for deploying data models to ThoughtSpot:
- Creates Snowflake connections
- Parses DDL and creates tables
- Generates and deploys models
Usage:
from thoughtspot_deployer import ThoughtSpotDeployer
deployer = ThoughtSpotDeployer()
results = deployer.deploy_all(ddl, database, schema)
"""
import os
from supabase_client import get_admin_setting
import re
import yaml
import json
import requests
import snowflake.connector
from datetime import datetime
from typing import Dict, List, Optional, Tuple
from dotenv import load_dotenv
from snowflake_auth import get_snowflake_connection_params
# Load environment variables
load_dotenv()
def _safe_print(*args, **kwargs):
"""Print that ignores BrokenPipeError - prevents crashes when output is closed."""
try:
print(*args, **kwargs)
except BrokenPipeError:
pass
def _apply_naming_style(name: str, style: str = "snake_case") -> str:
"""
Convert column name to specified naming style for ThoughtSpot display.
Args:
name: Original column name
style: Naming style - one of: Regular Case, snake_case, camelCase, PascalCase, UPPER_CASE, original
Examples (for "SHIPPING_MODE"):
Regular Case → Shipping Mode
snake_case → shipping_mode
camelCase → shippingMode
PascalCase → ShippingMode
UPPER_CASE → SHIPPING_MODE
original → SHIPPING_MODE (unchanged)
"""
name = name.strip()
if style == "original":
return name
if style == "UPPER_CASE":
return name.upper().replace(" ", "_")
# Split into words (handle underscores, spaces, and camelCase)
import re
# Split on underscores, spaces, or camelCase boundaries
words = re.split(r'[_\s]+', name)
# Further split camelCase words
expanded_words = []
for word in words:
# Split on camelCase boundaries (e.g., "firstName" -> ["first", "Name"])
parts = re.findall(r'[A-Z]?[a-z]+|[A-Z]+(?=[A-Z][a-z]|\d|\W|$)|\d+', word)
if parts:
expanded_words.extend(parts)
else:
expanded_words.append(word)
words = [w.lower() for w in expanded_words if w]
if not words:
return name.lower()
if style == "Regular Case":
# Title case each word, join with spaces: STATE_ID -> State Id
return " ".join(w.capitalize() for w in words)
if style == "snake_case":
return "_".join(words)
elif style == "camelCase":
# First word lowercase, rest capitalized
return words[0] + "".join(w.capitalize() for w in words[1:])
elif style == "PascalCase":
# All words capitalized
return "".join(w.capitalize() for w in words)
else:
# Default to snake_case
return "_".join(words)
def _to_snake_case(name: str) -> str:
    """Legacy snake_case helper; thin wrapper over _apply_naming_style()."""
    return _apply_naming_style(name, style="snake_case")
class ThoughtSpotDeployer:
"""ThoughtSpot deployment automation"""
def __init__(self, base_url: str = None, username: str = None, secret_key: str = None):
"""
Initialize ThoughtSpot deployer (trusted auth only)
Reads from environment variables if not passed directly.
Env vars are populated from Supabase admin settings at login time.
Raises ValueError if any required setting is missing.
"""
self.base_url = base_url if base_url else get_admin_setting('THOUGHTSPOT_URL')
if not username:
raise ValueError("ThoughtSpotDeployer requires username — pass the logged-in user's email")
self.username = username
if not secret_key:
raise ValueError("ThoughtSpotDeployer requires secret_key — pass the trusted auth key for the selected environment")
self.secret_key = secret_key
# Snowflake connection details from environment (key pair auth)
self.sf_account = get_admin_setting('SNOWFLAKE_ACCOUNT')
self.sf_user = get_admin_setting('SNOWFLAKE_KP_USER')
self.sf_role = get_admin_setting('SNOWFLAKE_ROLE')
self.sf_warehouse = get_admin_setting('SNOWFLAKE_WAREHOUSE')
self.headers = {
'Content-Type': 'application/json',
'X-Requested-By': 'ThoughtSpot'
}
# Use session to maintain cookies between requests
self.session = requests.Session()
self.session.headers.update(self.headers)
# Column naming style for ThoughtSpot model columns
# Options: Regular Case, snake_case, camelCase, PascalCase, UPPER_CASE, original
self.column_naming_style = "Regular Case"
# Per-session prompt logger — set by the chat controller after construction
self.prompt_logger = None
# Validate credentials for trusted auth
if not all([self.base_url, self.username, self.secret_key]):
raise ValueError("Missing ThoughtSpot URL, username, or trusted auth key")
if not all([self.sf_account, self.sf_user, self.sf_role, self.sf_warehouse]):
raise ValueError("Missing required Snowflake credentials in environment variables")
def _get_private_key_for_thoughtspot(self) -> str:
"""Get private key in format suitable for ThoughtSpot TML"""
private_key_raw = get_admin_setting('SNOWFLAKE_KP_PK')
if not private_key_raw:
raise ValueError("SNOWFLAKE_KP_PK environment variable not set")
# ThoughtSpot expects the private key as raw PEM format string
if not private_key_raw.startswith('-----BEGIN'):
# If it's base64 encoded, decode it
import base64
try:
private_key_raw = base64.b64decode(private_key_raw).decode('utf-8')
except Exception:
pass
return private_key_raw
    def authenticate(self) -> bool:
        """Authenticate with ThoughtSpot.

        Trusted (secret-key) authentication is the only supported flow;
        this simply delegates to authenticate_trusted().

        Returns:
            True on successful authentication, False otherwise.
        """
        return self.authenticate_trusted()
def authenticate_trusted(self) -> bool:
"""Authenticate with ThoughtSpot using trusted authentication (secret key)"""
try:
auth_url = f"{self.base_url}/api/rest/2.0/auth/token/full"
print(f" 🔐 Attempting trusted authentication to: {auth_url}")
print(f" 👤 Username: {self.username}")
print(f" 🔑 Using secret key: {self.secret_key[:8]}...{self.secret_key[-4:]}" if self.secret_key and len(self.secret_key) > 12 else " 🔑 Using secret key")
response = self.session.post(
auth_url,
json={
"username": self.username,
"secret_key": self.secret_key,
"validity_time_in_sec": 3600 # 1 hour token
}
)
print(f" 📡 HTTP Status: {response.status_code}")
if response.status_code == 200:
result = response.json()
if 'token' in result:
# Use the token as bearer auth
self.session.headers['Authorization'] = f'Bearer {result["token"]}'
print(" ✅ Trusted authentication successful (bearer token)")
return True
else:
print(f" ❌ No token in response: {result}")
return False
elif response.status_code == 204:
# Session cookie auth
print(" ✅ Trusted authentication successful (session cookies)")
return True
else:
print(f" ❌ HTTP Error {response.status_code}: {response.text}")
return False
except Exception as e:
print(f" 💥 Trusted authentication exception: {e}")
return False
def authenticate_oauth(self, timeout: int = 120) -> bool:
"""
Authenticate with ThoughtSpot using browser-based SSO (Okta, SAML, etc.)
Opens browser to ThoughtSpot login, user authenticates via SSO,
and cookies are captured via a local callback server.
Args:
timeout: Seconds to wait for authentication (default 120)
Returns:
True if authentication successful, False otherwise
"""
import webbrowser
import http.server
import socketserver
import threading
import urllib.parse
print(f" 🔐 Starting OAuth/SSO authentication for: {self.base_url}")
print(f" 👤 User: {self.username or 'SSO user'}")
# Find an available port for the callback server
callback_port = 8765
for port in range(8765, 8800):
try:
with socketserver.TCPServer(("", port), None) as test:
callback_port = port
break
except OSError:
continue
callback_url = f"http://localhost:{callback_port}/callback"
auth_complete = threading.Event()
auth_success = [False] # Use list to allow modification in nested function
class OAuthCallbackHandler(http.server.BaseHTTPRequestHandler):
def log_message(self, format, *args):
pass # Suppress logging
def do_GET(self):
if self.path.startswith('/callback'):
# Authentication completed - show success page
self.send_response(200)
self.send_header('Content-type', 'text/html')
self.end_headers()
# Page that extracts cookies and displays success
html = """
ThoughtSpot Authentication
✓
Authentication Successful!
You can close this window and return to the application.
"""
self.wfile.write(html.encode())
auth_success[0] = True
auth_complete.set()
elif self.path == '/check':
# Health check endpoint
self.send_response(200)
self.send_header('Content-type', 'text/plain')
self.end_headers()
self.wfile.write(b'OK')
else:
self.send_response(404)
self.end_headers()
# Start callback server in background thread
server = socketserver.TCPServer(("", callback_port), OAuthCallbackHandler)
server_thread = threading.Thread(target=server.handle_request)
server_thread.daemon = True
server_thread.start()
# Build the SSO login URL
# ThoughtSpot redirects to SSO provider, then back to ThoughtSpot, then to our callback
ts_login_url = f"{self.base_url}/?redirectURL={urllib.parse.quote(callback_url)}"
print(f" 🌐 Opening browser for SSO login...")
print(f" 📍 Callback URL: {callback_url}")
print(f" ⏳ Waiting up to {timeout} seconds for authentication...")
# Open browser to ThoughtSpot login
webbrowser.open(ts_login_url)
# Wait for authentication to complete
if auth_complete.wait(timeout=timeout):
if auth_success[0]:
print(" ✅ Browser authentication completed!")
# Now we need to get the session from ThoughtSpot
# The user authenticated in the browser, so we need to get a session token
# We'll use the session/token endpoint to get a token for API calls
# Try to get a session token using the trusted auth flow
# Since user is now logged in via browser, we attempt to get session info
try:
# Check if session is valid by calling a simple API endpoint
# First, let's try to get current user info
user_response = self.session.get(
f"{self.base_url}/api/rest/2.0/auth/session/user",
timeout=10
)
if user_response.status_code == 200:
user_info = user_response.json()
print(f" ✅ Session active for: {user_info.get('name', 'unknown')}")
return True
else:
# Browser auth completed but we don't have cookies in our session
# This is expected - browser and Python have separate cookie jars
print(" ⚠️ Browser authenticated but Python session needs cookies")
print(" 💡 For full OAuth support, please use the browser-based workflow")
print(" 💡 Or configure trusted authentication on ThoughtSpot")
return False
except Exception as e:
print(f" ⚠️ Could not verify session: {e}")
return False
else:
print(" ❌ Authentication callback received but marked as failed")
return False
else:
print(" ❌ Authentication timed out")
server.shutdown()
return False
def get_model_columns(self, model_guid: str) -> List[Dict]:
"""
Get actual column names from a ThoughtSpot model.
This is important because ThoughtSpot may rename columns to make them unique
(e.g., PROCESSING_FEE becomes gift_processing_fee and tran_processing_fee).
Args:
model_guid: GUID of the ThoughtSpot model
Returns:
List of column dicts with 'name' and 'type' keys
"""
try:
# Export the model TML to get actual column names
export_response = self.session.post(
f"{self.base_url}/api/rest/2.0/metadata/tml/export",
json={
'metadata': [{'identifier': model_guid}],
'export_associated': False
}
)
if export_response.status_code != 200:
print(f" ⚠️ Could not export model TML: HTTP {export_response.status_code}")
return []
tml_data = export_response.json()
if not tml_data or len(tml_data) == 0:
print(f" ⚠️ Empty TML export response")
return []
# Parse YAML TML
tml_str = tml_data[0].get('edoc', '')
model_tml = yaml.safe_load(tml_str)
if not model_tml or 'model' not in model_tml:
print(f" ⚠️ Invalid model TML structure")
return []
# Extract columns with their actual names from the model
columns = []
for col in model_tml.get('model', {}).get('columns', []):
col_name = col.get('name', '')
col_props = col.get('properties', {})
col_type = col_props.get('column_type', 'ATTRIBUTE')
# Map ThoughtSpot column types to SQL-like types for AI understanding
if col_type == 'MEASURE':
sql_type = 'NUMBER' # Measures are numeric
elif col_props.get('calendar'):
sql_type = 'DATE' # Calendar attribute = date column
else:
sql_type = 'VARCHAR' # Other attributes are typically strings
columns.append({
'name': col_name,
'type': sql_type,
'ts_type': col_type # Keep original for reference
})
print(f" 📊 Got {len(columns)} columns from ThoughtSpot model")
return columns
except Exception as e:
print(f" ⚠️ Error getting model columns: {e}")
return []
def parse_ddl(self, ddl: str) -> Tuple[Dict, List]:
"""
Parse DDL to extract table definitions and foreign key relationships
Returns:
Tuple of (tables_dict, foreign_keys_list)
"""
tables = {}
foreign_keys = []
# Find all CREATE TABLE statements
table_pattern = (
r'CREATE\s+TABLE\s+(?:IF\s+NOT\s+EXISTS\s+)?'
r'(?:"?([A-Za-z0-9_]+)"?)\s*\((.*?)\)\s*;'
)
for match in re.finditer(table_pattern, ddl, re.IGNORECASE | re.DOTALL):
table_name = match.group(1).upper()
columns_text = match.group(2)
columns = []
# Parse each column definition - PROPERLY FIXED parsing
# Split by comma but be careful of commas inside parentheses
column_lines = []
current_line = ""
paren_count = 0
for char in columns_text:
if char == '(':
paren_count += 1
elif char == ')':
paren_count -= 1
elif char == ',' and paren_count == 0:
column_lines.append(current_line.strip())
current_line = ""
continue
current_line += char
# Add the last line
if current_line.strip():
column_lines.append(current_line.strip())
for line in column_lines:
line = line.strip()
line_upper = line.upper()
def _normalize_table_name(raw_name: str) -> str:
# Handle optional quoting and optional DB/SCHEMA qualifiers.
normalized = raw_name.replace('"', '').strip()
if '.' in normalized:
normalized = normalized.split('.')[-1]
return normalized.upper()
# Parse FK constraints in any common table-level form:
# 1) FOREIGN KEY (COL) REFERENCES TBL(COL)
# 2) CONSTRAINT FK_NAME FOREIGN KEY (COL) REFERENCES TBL(COL)
fk_match = re.search(
r'FOREIGN\s+KEY\s*\((\w+)\)\s*REFERENCES\s+([A-Za-z0-9_".]+)\s*\((\w+)\)',
line,
re.IGNORECASE
)
if fk_match:
from_col = fk_match.group(1).upper()
to_table = _normalize_table_name(fk_match.group(2))
to_col = fk_match.group(3).upper()
foreign_keys.append({
'from_table': table_name,
'from_column': from_col,
'to_table': to_table,
'to_column': to_col
})
print(f" 🔗 Found FK: {table_name}.{from_col} -> {to_table}.{to_col}")
continue
# Parse inline FK form in column definitions:
# COL_NAME REFERENCES TARGET_TABLE(TARGET_COL)
inline_fk_match = re.search(
r'^(\w+)\s+.+?\s+REFERENCES\s+([A-Za-z0-9_".]+)\s*\((\w+)\)',
line,
re.IGNORECASE
)
if inline_fk_match:
from_col = inline_fk_match.group(1).upper()
to_table = _normalize_table_name(inline_fk_match.group(2))
to_col = inline_fk_match.group(3).upper()
foreign_keys.append({
'from_table': table_name,
'from_column': from_col,
'to_table': to_table,
'to_column': to_col
})
print(f" 🔗 Found inline FK: {table_name}.{from_col} -> {to_table}.{to_col}")
if not line_upper.startswith(('PRIMARY KEY', 'CONSTRAINT', 'FOREIGN KEY', 'UNIQUE', 'CHECK', 'INDEX')):
# Parse: COLUMNNAME DATATYPE(params) [IDENTITY] [NOT NULL]
parts = line.split()
if len(parts) >= 2:
col_name_original = parts[0] # Preserve original casing for display name
col_name = parts[0].upper() # Uppercase for DB reference
# Get the FULL data type including parameters - HANDLE IDENTITY!
col_type_match = re.match(r'(\w+(?:\([^)]+\))?)', parts[1])
col_type = col_type_match.group(1).upper() if col_type_match else parts[1].upper()
columns.append({
'name': col_name,
'original_name': col_name_original, # Keep original for naming style
'type': col_type,
'nullable': 'NOT NULL' not in line.upper()
})
tables[table_name] = columns
print(f"📊 Found {len(tables)} tables and {len(foreign_keys)} foreign keys in DDL")
return tables, foreign_keys
    def create_relationships_separately(self, table_relationships: Dict, table_guids: Dict):
        """Create relationships as separate TML objects after tables exist.

        Args:
            table_relationships: Mapping of source table name -> list of
                relationship dicts, each with 'name', 'to_table', 'type' and
                'on' (a list of {'from_column', 'to_column'} pairs).
            table_guids: Mapping of table name -> ThoughtSpot GUID, used to
                reference the already-created tables.

        Side effects:
            POSTs one TML import per relationship and prints the outcome.
            NOTE(review): result[0] assumes the import API returns a non-empty
            list on HTTP 200 — confirm against the REST v2 import contract.
        """
        for table_name, relationships in table_relationships.items():
            for relationship in relationships:
                # Build a standalone relationship TML document; guid None means
                # ThoughtSpot assigns one on import.
                relationship_tml = {
                    'guid': None,
                    'relationship': {
                        'name': relationship['name'],
                        'destination_table': table_guids.get(relationship['to_table']),
                        'source_table': table_guids.get(table_name),
                        'type': relationship['type'],
                        'join_columns': [
                            {
                                'source_column': rel_on['from_column'],
                                'destination_column': rel_on['to_column']
                            }
                            for rel_on in relationship['on']
                        ]
                    }
                }
                relationship_yaml = yaml.dump(relationship_tml, default_flow_style=False, sort_keys=False)
                print(f" 🔗 Creating relationship: {relationship['name']}")
                print(f" 📄 Relationship TML:\n{relationship_yaml}")
                response = self.session.post(
                    f"{self.base_url}/api/rest/2.0/metadata/tml/import",
                    json={
                        "metadata_tmls": [relationship_yaml],
                        "import_policy": "ALL_OR_NONE",
                        "create_new": True
                    }
                )
                if response.status_code == 200:
                    result = response.json()
                    print(f" 📋 Relationship response: {result}")
                    # Per-object import status lives in the first result element.
                    if result[0].get('response', {}).get('status', {}).get('status_code') == 'OK':
                        print(f" ✅ Relationship created: {relationship['name']}")
                    else:
                        error_msg = result[0].get('response', {}).get('status', {}).get('error_message', 'Unknown error')
                        print(f" ❌ Relationship failed: {error_msg}")
                else:
                    print(f" ❌ Relationship API call failed: {response.status_code}")
                    print(f" 📋 Response: {response.text}")
def create_table_tml(self, table_name: str, columns: List, connection_name: str,
database: str, schema: str, all_tables: Dict = None, table_guid: str = None, foreign_keys: List = None) -> str:
"""Generate table TML matching working example structure
Args:
table_guid: If provided, use this GUID (for updating existing tables with joins)
foreign_keys: List of foreign key relationships parsed from DDL
"""
tml_columns = []
# Generate columns with proper typing
for col in columns:
ts_type = self._map_data_type(col['type'])
col_name = col['name'].upper()
# Determine column type - IDs are measures in table TML but not model TML
if ts_type in ['INT64'] and col_name.endswith('ID'):
col_type = 'MEASURE'
properties = {
'column_type': col_type,
'aggregation': 'SUM',
'index_type': 'DONT_INDEX'
}
elif ts_type in ['DOUBLE', 'INT64'] and not col_name.endswith('ID'):
col_type = 'MEASURE'
properties = {
'column_type': col_type,
'aggregation': 'SUM',
'index_type': 'DONT_INDEX'
}
else:
col_type = 'ATTRIBUTE'
properties = {
'column_type': col_type,
'index_type': 'DONT_INDEX'
}
column_def = {
'name': col['name'].upper(),
'db_column_name': col['name'].upper(),
'properties': properties,
'db_column_properties': {
'data_type': ts_type
}
}
tml_columns.append(column_def)
table_tml = {
'guid': table_guid, # Use provided GUID or None for new tables
'table': {
'name': table_name.upper(),
'db': database,
'schema': schema,
'db_table': table_name.upper(),
'connection': {
'name': connection_name
},
'columns': tml_columns,
'properties': {
'sage_config': {
'is_sage_enabled': False
}
}
}
}
# Add joins_with relationships (matching working example)
if all_tables:
joins_with = self._generate_table_joins(table_name, columns, all_tables, foreign_keys)
if joins_with:
table_tml['table']['joins_with'] = joins_with
# Generate YAML with proper formatting
yaml_output = yaml.dump(table_tml, default_flow_style=False, sort_keys=False)
# Keep quotes around 'on' key as shown in working example
return yaml_output
def _generate_table_joins(self, table_name: str, columns: List, all_tables: Dict, foreign_keys: List = None) -> List:
"""Generate joins_with structure based on parsed foreign keys from DDL"""
joins = []
table_name_upper = table_name.upper()
if not foreign_keys:
print(f" ⚠️ No foreign keys provided for {table_name_upper}")
return joins
# Use actual foreign keys from DDL
for fk in foreign_keys:
if fk['from_table'] == table_name_upper:
to_table = fk['to_table']
from_col = fk['from_column']
to_col = fk['to_column']
# Skip self-joins (e.g., EMPLOYEES.MANAGER_ID -> EMPLOYEES.EMPLOYEE_ID)
# ThoughtSpot models don't handle self-referential joins well (causes cycles)
if to_table == table_name_upper:
print(f" ⏭️ Skipping self-join: {table_name_upper}.{from_col} -> {to_table}.{to_col} (self-referential)")
continue
# Check if target table exists in THIS deployment
available_tables_upper = [t.upper() for t in all_tables.keys()]
if to_table in available_tables_upper:
constraint_id = f"SYS_CONSTRAINT_{self._generate_constraint_id()}"
join_def = {
'name': constraint_id,
'destination': {
'name': to_table
},
'on': f"[{table_name_upper}::{from_col}] = [{to_table}::{to_col}]",
'type': 'INNER'
}
joins.append(join_def)
print(f" 🔗 Generated join: {table_name_upper}.{from_col} -> {to_table}.{to_col}")
else:
print(f" ⏭️ Skipping join: {table_name_upper}.{from_col} -> {to_table} (table not in this deployment)")
return joins
def create_connection_tml(self, connection_name: str) -> str:
"""Generate connection TML matching working example"""
connection_tml = {
'guid': None, # Will be generated by ThoughtSpot
'connection': {
'name': connection_name,
'type': 'RDBMS_SNOWFLAKE',
'authentication_type': 'KEY_PAIR',
'properties': [
{'key': 'accountName', 'value': self.sf_account},
{'key': 'user', 'value': self.sf_user},
{'key': 'private_key', 'value': self._get_private_key_for_thoughtspot()},
{'key': 'passphrase', 'value': get_admin_setting('SNOWFLAKE_KP_PASSPHRASE', required=False)},
{'key': 'role', 'value': self.sf_role},
{'key': 'warehouse', 'value': self.sf_warehouse}
],
'description': f'Auto-generated Snowflake connection for {connection_name}'
}
}
yaml_output = yaml.dump(connection_tml, default_flow_style=False, sort_keys=False)
return yaml_output
    def create_actual_model_tml(self, tables: Dict, foreign_keys: List, table_guids: Dict = None,
                                model_name: str = None, connection_name: str = None) -> str:
        """Generate model TML (without explicit joins) matching the boone_test5 working example.

        Tables are referenced by FQN (their GUID) to disambiguate duplicate
        names, joins are omitted so ThoughtSpot can auto-detect them, and
        column display names are de-conflicted globally across all tables.

        Args:
            tables: TABLE_NAME -> column dicts (parse_ddl output).
            foreign_keys: Parsed FK list (not embedded here since joins are omitted).
            table_guids: TABLE_NAME -> GUID of the already-created tables.
            model_name: Display name; defaults to demo_model_<YYYYMMDD>.
            connection_name: Defaults to model_name.

        Returns:
            Validated YAML string for the model TML.

        Raises:
            ValueError: If the generated YAML fails to round-trip through yaml.safe_load.
        """
        if not model_name:
            model_name = f"demo_model_{datetime.now().strftime('%Y%m%d')}"
        if not connection_name:
            connection_name = model_name
        # Create model structure matching working example exactly
        model = {
            'guid': None,  # Will be generated by ThoughtSpot
            'model': {
                'name': model_name,
                'model_tables': [],
                'columns': [],
                'properties': {
                    'is_bypass_rls': False,
                    'join_progressive': True,
                    'spotter_config': {
                        'is_spotter_enabled': True
                    }
                }
            }
        }
        # Track which tables each column name appears in, so conflicts can be
        # resolved deterministically below.
        column_name_counts = {}
        for table_name, columns in tables.items():
            for col in columns:
                col_name = col['name'].upper()
                if col_name not in column_name_counts:
                    column_name_counts[col_name] = []
                column_name_counts[col_name].append(table_name.upper())
        # Add model_tables - START WITH NO JOINS for now (we can add them later)
        print(" 📋 Creating model without explicit joins (ThoughtSpot can auto-detect)")
        for table_name in tables.keys():
            table_name_upper = table_name.upper()
            table_guid = table_guids.get(table_name_upper) if table_guids else None
            # Use FQN to resolve the "multiple data sources with same name" issue;
            # ThoughtSpot explicitly requires this when table names are duplicated.
            table_entry = {
                'name': table_name_upper,
                'fqn': table_guid  # Required to uniquely identify which table to use
            }
            # No explicit joins here — ThoughtSpot auto-detects them.
            model['model']['model_tables'].append(table_entry)
        # Remove diamond join paths - ThoughtSpot rejects models where
        # table A joins to B, A joins to C, and C also joins to B
        self._remove_diamond_joins(model['model']['model_tables'])
        # Add columns with proper global conflict resolution
        used_display_names = set()  # Track used names globally across all columns
        for table_name, columns in tables.items():
            table_name_upper = table_name.upper()
            for col in columns:
                col_name = col['name'].upper()
                original_col_name = col.get('original_name', col['name'])  # Use original casing for display
                # TODO: Later we can exclude ID columns for cleaner model
                # For now, include all columns to get the basic model working
                # Start with basic conflict resolution
                display_name = self._resolve_column_name_conflict(
                    col_name, table_name_upper, column_name_counts,
                    original_name=original_col_name
                )
                # If the display name is still used, make it unique with table prefixes
                original_display_name = display_name
                counter = 1
                while display_name.lower() in used_display_names:
                    # First collision: prepend a short prefix derived from the table name
                    if counter == 1:
                        if len(table_name_upper) <= 4:
                            prefix = table_name_upper.lower()
                        else:
                            prefix = table_name_upper[:4].lower()
                        # Use snake_case: prefix_name
                        display_name = f"{prefix}_{original_display_name}"
                    else:
                        # Fallback: add number
                        display_name = f"{original_display_name}_{counter}"
                    counter += 1
                used_display_names.add(display_name.lower())
                # Determine column type based on data type
                col_type, aggregation = self._determine_column_type(col['type'], col_name)
                column_def = {
                    'name': display_name,
                    'column_id': f"{table_name_upper}::{col_name}",
                    'properties': {
                        'column_type': col_type,
                        'index_type': 'DONT_INDEX'
                    }
                }
                # Add aggregation for measures
                if aggregation:
                    column_def['properties']['aggregation'] = aggregation
                # Add calendar property for DATE columns so ThoughtSpot enables
                # time bucketing (.weekly, .monthly, etc.) on them
                if self._map_data_type(col['type']) == 'DATE':
                    column_def['properties']['calendar'] = 'calendar'
                model['model']['columns'].append(column_def)
        # Generate YAML output with proper formatting
        yaml_output = yaml.dump(model, default_flow_style=False, sort_keys=False,
                                default_style=None, indent=2, width=120)
        # Validate the generated YAML by round-tripping it.
        try:
            yaml.safe_load(yaml_output)
            print(" ✅ Generated YAML is valid")
        except yaml.YAMLError as e:
            print(f" ❌ Generated YAML is invalid: {e}")
            print(" 📄 Invalid YAML:")
            print(yaml_output)
            raise ValueError(f"Generated invalid YAML: {e}")
        return yaml_output
def _is_foreign_key_column(self, col_name: str, table_name: str, foreign_keys: List) -> bool:
"""Check if column is a foreign key (used only for joins, not analytics)"""
for fk in foreign_keys:
if (fk.get('source_table', '').upper() == table_name and
fk.get('source_column', '').upper() == col_name):
return True
return False
def _is_surrogate_primary_key(self, col: Dict, col_name: str) -> bool:
"""Check if column is a meaningless surrogate key (numeric ID)"""
# Common patterns: ID, _ID, ID_, ends with 'id'
if col_name.upper().endswith('ID'):
# Check if it's numeric (INT, BIGINT, NUMBER)
col_type = col.get('type', '').upper()
if any(t in col_type for t in ['INT', 'NUMBER', 'NUMERIC', 'BIGINT']):
return True
return False
    def _create_model_with_constraints(self, tables: Dict, foreign_keys: List, table_guids: Dict,
                                       table_constraints: Dict, model_name: str, connection_name: str) -> str:
        """Generate model TML with explicit constraint-based joins.

        Unlike create_actual_model_tml (which omits joins), this variant embeds
        LEFT_OUTER / MANY_TO_ONE joins derived from the parsed foreign keys,
        prunes cyclic join paths, and fixes YAML's quoting of the 'on' key.

        Args:
            tables: TABLE_NAME -> column dicts (parse_ddl output).
            foreign_keys: FK dicts with from_table/from_column/to_table/to_column.
            table_guids: TABLE_NAME -> GUID; used as each model table's FQN.
            table_constraints: Not read here — joins are rebuilt from
                foreign_keys, which proved more reliable than constraint
                extraction. Kept for interface stability.
            model_name: Model display name.
            connection_name: Not embedded in the TML; kept for interface parity.

        Returns:
            Validated YAML string.

        Raises:
            ValueError: If the generated YAML fails to round-trip through yaml.safe_load.
        """
        print(" 📋 Creating model with constraint references")
        # Track which tables each column name appears in, for conflict resolution.
        column_name_counts = {}
        for table_name, columns in tables.items():
            for col in columns:
                col_name = col['name'].upper()
                if col_name not in column_name_counts:
                    column_name_counts[col_name] = []
                column_name_counts[col_name].append(table_name.upper())
        model = {
            'guid': None,
            'model': {
                'name': model_name,
                'model_tables': [],
                'columns': [],
                'properties': {
                    'is_bypass_rls': False,
                    'join_progressive': True,
                    'spotter_config': {
                        'is_spotter_enabled': True
                    }
                }
            }
        }
        # Add model_tables with FQNs and constraint-based joins
        for table_name in tables.keys():
            table_name_upper = table_name.upper()
            table_guid = table_guids.get(table_name_upper)
            table_entry = {
                'name': table_name_upper,
                'fqn': table_guid
            }
            # Build joins from foreign_keys list (more reliable than constraint extraction)
            table_joins = []
            for fk in foreign_keys:
                if fk['from_table'].upper() == table_name_upper:
                    to_table = fk['to_table'].upper()
                    # Skip self-joins (e.g., EMPLOYEES.MANAGER_ID -> EMPLOYEES.EMPLOYEE_ID)
                    # ThoughtSpot models don't handle self-referential joins well (causes cycles)
                    if to_table == table_name_upper:
                        print(f" ⏭️ Skipping self-join in model: {table_name_upper}.{fk['from_column']} -> {to_table}")
                        continue
                    # Only join to tables that are part of this deployment.
                    if to_table in [t.upper() for t in tables.keys()]:
                        # ThoughtSpot on clause format: [SOURCE::COL] = [DEST::COL]
                        from_col = fk['from_column'].upper()
                        to_col = fk['to_column'].upper()
                        on_clause = f"[{table_name_upper}::{from_col}] = [{to_table}::{to_col}]"
                        join_entry = {
                            'with': to_table,
                            'on': on_clause,
                            'type': 'LEFT_OUTER',
                            'cardinality': 'MANY_TO_ONE'  # Fact to dimension is many-to-one
                        }
                        table_joins.append(join_entry)
                        print(f" 🔗 Added join: {table_name_upper}.{from_col} -> {to_table}.{to_col}")
            if table_joins:
                table_entry['joins'] = table_joins
            model['model']['model_tables'].append(table_entry)
        # Remove diamond join paths - ThoughtSpot rejects models where
        # table A joins to B, A joins to C, and C also joins to B
        self._remove_diamond_joins(model['model']['model_tables'])
        # Add columns with proper global conflict resolution (same as working version)
        used_display_names = set()
        for table_name, columns in tables.items():
            table_name_upper = table_name.upper()
            for col in columns:
                col_name = col['name'].upper()
                original_col_name = col.get('original_name', col['name'])  # Use original casing for display
                # NOTE: FK/PK columns are deliberately NOT skipped — ThoughtSpot
                # requires the join columns to be present in the model's columns
                # section for the joins to work, even though users never search
                # on raw surrogate keys.
                # Start with basic conflict resolution
                display_name = self._resolve_column_name_conflict(
                    col_name, table_name_upper, column_name_counts,
                    original_name=original_col_name
                )
                # If the display name is still used, make it unique with table prefixes
                original_display_name = display_name
                counter = 1
                while display_name.lower() in used_display_names:
                    # First collision: short hard-coded table prefix (snake_case);
                    # unknown tables fall back to the first 4 chars of their name.
                    if counter == 1:
                        if table_name_upper == 'CUSTOMERS':
                            display_name = f"cust_{original_display_name}"
                        elif table_name_upper == 'PRODUCTS':
                            display_name = f"prod_{original_display_name}"
                        elif table_name_upper == 'ORDERS':
                            display_name = f"order_{original_display_name}"
                        elif table_name_upper == 'ORDERITEMS':
                            display_name = f"item_{original_display_name}"
                        elif table_name_upper == 'SALES':
                            display_name = f"sale_{original_display_name}"
                        elif table_name_upper == 'SALESREPS':
                            display_name = f"rep_{original_display_name}"
                        else:
                            display_name = f"{table_name_upper[:4].lower()}_{original_display_name}"
                    else:
                        display_name = f"{original_display_name}_{counter}"
                    counter += 1
                used_display_names.add(display_name.lower())
                # Determine column type based on data type
                col_type, aggregation = self._determine_column_type(col['type'], col_name)
                column_def = {
                    'name': display_name,
                    'column_id': f"{table_name_upper}::{col_name}",
                    'properties': {
                        'column_type': col_type,
                        'index_type': 'DONT_INDEX'
                    }
                }
                if aggregation:
                    column_def['properties']['aggregation'] = aggregation
                # Add calendar property for DATE columns so ThoughtSpot enables
                # time bucketing (.weekly, .monthly, etc.) on them
                if self._map_data_type(col['type']) == 'DATE':
                    column_def['properties']['calendar'] = 'calendar'
                model['model']['columns'].append(column_def)
        # Generate YAML output with validation
        yaml_output = yaml.dump(model, default_flow_style=False, sort_keys=False,
                                default_style=None, indent=2, width=120)
        # Fix YAML reserved word quoting - 'on' gets quoted because it's a YAML boolean
        # ThoughtSpot needs it unquoted
        yaml_output = yaml_output.replace("'on':", "on:")
        # Validate the generated YAML by round-tripping it.
        try:
            yaml.safe_load(yaml_output)
            print(" ✅ Generated YAML is valid")
        except yaml.YAMLError as e:
            print(f" ❌ Generated YAML is invalid: {e}")
            raise ValueError(f"Generated invalid YAML: {e}")
        return yaml_output
def _remove_diamond_joins(self, model_tables: list):
"""Remove join cycles that ThoughtSpot rejects using a spanning tree.
ThoughtSpot requires exactly ONE path between any two tables in a model.
Uses Kruskal's algorithm: add edges from highest-priority (fact) tables first,
skip any edge that would create a cycle. Priority order ensures fact table
joins are preserved and dimension-to-dimension "snowflake" joins are pruned.
"""
def edge_key(src_name: str, join_def: dict):
return (
src_name,
join_def.get('with'),
join_def.get('on', ''),
join_def.get('type', ''),
join_def.get('cardinality', ''),
)
all_edges = []
for t in model_tables:
src_name = t['name']
for j in t.get('joins', []):
all_edges.append((src_name, j.get('with'), j, edge_key(src_name, j)))
if not all_edges:
print(f" ✅ No joins to check for cycles")
return
out_degree = {}
for t in model_tables:
out_degree[t['name']] = len(t.get('joins', []))
in_degree = {t['name']: 0 for t in model_tables}
for src, dst, _, _ in all_edges:
in_degree[dst] = in_degree.get(dst, 0) + 1
all_edges.sort(key=lambda e: (-out_degree.get(e[0], 0), -in_degree.get(e[1], 0), e[0], e[1]))
parent = {t['name']: t['name'] for t in model_tables}
def find(x):
while parent[x] != x:
parent[x] = parent[parent[x]]
x = parent[x]
return x
def union(a, b):
ra, rb = find(a), find(b)
if ra == rb:
return False
parent[ra] = rb
return True
kept_edge_keys = set()
removed = []
for src, dst, join_def, e_key in all_edges:
if union(src, dst):
kept_edge_keys.add(e_key)
else:
removed.append(f"{src}->{dst} ({join_def.get('on', '')})")
for t in model_tables:
if 'joins' not in t:
continue
src_name = t['name']
t['joins'] = [j for j in t['joins'] if edge_key(src_name, j) in kept_edge_keys]
for t in model_tables:
if 'joins' in t and not t['joins']:
del t['joins']
if removed:
print(f" 🔶 Removed {len(removed)} redundant joins (cycle prevention):")
for r in removed:
print(f" - {r}")
else:
print(f" ✅ No join cycles detected")
def _generate_constraint_id(self) -> str:
"""Generate a constraint ID similar to ThoughtSpot's system constraints"""
import uuid
return str(uuid.uuid4())
def validate_foreign_key_references(self, tables: Dict, foreign_keys: List = None) -> List[str]:
    """
    Validate that foreign key columns reference tables that exist in the schema.
    Uses explicit FK constraints from DDL - not heuristics.

    Args:
        tables: Dictionary of table definitions
        foreign_keys: List of FK relationships parsed from DDL
            Each FK is: {'from_table': str, 'from_column': str,
                         'to_table': str, 'to_column': str}

    Returns:
        List of warning messages about missing referenced tables
    """
    if not foreign_keys:
        # No explicit FKs defined, nothing to validate
        return []

    known_tables = {name.upper() for name in tables.keys()}
    messages = []
    for fk in foreign_keys:
        referenced = fk.get('to_table', '')
        # A join whose destination is absent from the schema cannot be built.
        if referenced and referenced.upper() not in known_tables:
            messages.append(
                f"⚠️ {fk.get('from_table', '')}.{fk.get('from_column', '')} references {fk.get('to_table')}, "
                f"but {fk.get('to_table')} is not in this schema. "
                f"The join will be skipped during deployment."
            )
    return messages
def _resolve_column_name_conflict(self, col_name: str, table_name: str,
                                  column_name_counts: Dict,
                                  original_name: str = None) -> str:
    """
    Resolve column name conflicts using configured naming style and prefixes.

    Examples (snake_case):
        SHIPPING_MODE → shipping_mode
        DAYS_TO_SHIP → days_to_ship
        ORDER_DATE (conflict) → order_order_date, cust_order_date, etc.

    Args:
        col_name: Uppercase column name (for conflict detection)
        table_name: Table name for prefix generation
        column_name_counts: Dict tracking column name occurrences
        original_name: Original casing of column name (for proper camelCase detection)
    """
    # Prefer the caller-supplied original casing so camelCase word
    # boundaries survive the style conversion.
    source_name = original_name if original_name else col_name
    styled = _apply_naming_style(source_name, self.column_naming_style)

    # Column name unique across tables: no prefix needed.
    if len(column_name_counts.get(col_name, [])) <= 1:
        return styled

    # Conflict: derive a short, readable prefix from the table name.
    lowered = table_name.lower()
    if len(table_name) <= 4:
        prefix = lowered
    elif 'sales' in lowered and 'rep' in lowered:
        prefix = 'rep'      # special case for readability
    elif 'customer' in lowered:
        prefix = 'cust'     # common abbreviation
    elif 'product' in lowered:
        prefix = 'prod'     # common abbreviation
    elif 'order' in lowered:
        prefix = 'order'    # common abbreviation
    else:
        prefix = table_name[:4].lower()  # first 4 characters

    combined = f"{prefix}_{styled}" if styled else prefix
    return _apply_naming_style(combined, self.column_naming_style)
def _get_table_prefix(self, table_name: str) -> str:
"""Get appropriate prefix for table to avoid column conflicts"""
# Generate prefix dynamically based on table name patterns
table_lower = table_name.lower()
if 'customer' in table_lower:
return '' # Primary table gets no prefix for readability
elif 'sales' in table_lower and 'rep' in table_lower:
return 'Rep'
elif 'sales' in table_lower:
return 'Sale'
elif 'order' in table_lower and 'item' in table_lower:
return 'Item'
elif 'order' in table_lower:
return 'Order'
elif 'product' in table_lower:
return 'Product'
else:
# Use first 3-4 characters as prefix, capitalize first letter
prefix = table_name[:4] if len(table_name) > 3 else table_name
return prefix.capitalize()
def _determine_column_type(self, data_type: str, col_name: str) -> tuple:
"""Determine if column should be ATTRIBUTE or MEASURE"""
base_type = data_type.upper().split('(')[0]
col_upper = col_name.upper()
# SALEID is special - it's treated as a measure in the working example
if col_upper == 'SALEID':
return 'MEASURE', 'SUM'
# Numeric types should be measures (unless they're IDs or keys)
if base_type in ['NUMBER', 'DECIMAL', 'FLOAT', 'DOUBLE', 'INT', 'INTEGER', 'BIGINT']:
# Skip ID/KEY columns - they're join keys, not analytics columns
if col_upper.endswith('ID') or col_upper.endswith('KEY') or col_upper.endswith('_CODE'):
return 'ATTRIBUTE', None
# All other numeric columns are measures
# Determine aggregation based on column name patterns
if any(word in col_upper for word in ['QUANTITY', 'QTY', 'COUNT', 'SOLD']):
return 'MEASURE', 'SUM'
elif any(word in col_upper for word in ['PRICE', 'COST', 'REVENUE', 'AMOUNT', 'TOTAL', 'PROFIT', 'DISCOUNT', 'SHIPPING', 'TAX']):
return 'MEASURE', 'SUM'
elif any(word in col_upper for word in ['RATING', 'SCORE', 'MARGIN', 'PERCENT', 'RATE']):
return 'MEASURE', 'AVERAGE'
else:
# Default: numeric = measure with SUM
return 'MEASURE', 'SUM'
# Everything else is an attribute (strings, dates, booleans, etc.)
return 'ATTRIBUTE', None
def _build_table_relationships(self, tables: Dict, foreign_keys: List) -> Dict:
    """Build table relationships for joins.

    NOTE(review): a second method with this exact name is defined later in
    this class, so this earlier definition is shadowed and never invoked at
    runtime — consider removing one of the two. Unlike the later version,
    this one ignores the ``foreign_keys`` argument entirely and always
    auto-detects via naming heuristics.

    Heuristic: a column named ``<X>ID`` (other than the table's own id
    column) is treated as a foreign key to a table named ``<X>S``, if such
    a table exists (e.g. CUSTOMERID -> CUSTOMERS).

    Returns:
        Dict mapping upper-cased table name to a list of
        ``{'to_table': str, 'on_column': str}`` entries.
    """
    relationships = {}
    # Auto-detect relationships based on common ID patterns
    table_names = list(tables.keys())
    for table_name in table_names:
        table_name_upper = table_name.upper()
        table_cols = [col['name'].upper() for col in tables[table_name]]
        # Find foreign key relationships
        for col_name in table_cols:
            if col_name.endswith('ID') and col_name != f"{table_name_upper}ID":
                # This looks like a foreign key
                target_table = col_name[:-2] + 'S'  # CUSTOMERID -> CUSTOMERS
                if target_table in [t.upper() for t in table_names]:
                    if table_name_upper not in relationships:
                        relationships[table_name_upper] = []
                    relationships[table_name_upper].append({
                        'to_table': target_table,
                        'on_column': col_name
                    })
    return relationships
def _create_model_level_joins(self, tables, foreign_keys):
"""Create joins at model level using the format from working example"""
joins = []
# Auto-detect joins if no explicit foreign keys
if len(tables) > 1:
table_names = list(tables.keys())
for i, table1 in enumerate(table_names):
table1_upper = table1.upper()
table1_cols = [col['name'].upper() for col in tables[table1]]
for j, table2 in enumerate(table_names):
if i >= j: # Avoid duplicates and self-joins
continue
table2_upper = table2.upper()
table2_cols = [col['name'].upper() for col in tables[table2]]
# Look for matching ID columns
for col1 in table1_cols:
if col1.endswith('ID') and col1 in table2_cols:
join_entry = {
'name': f"{table1_upper.lower()}_{table2_upper.lower()}",
'source': table1_upper,
'destination': table2_upper,
'type': 'INNER',
'on': f"{table1_upper}.{col1} = {table2_upper}.{col1}"
}
joins.append(join_entry)
print(f" 🔗 Model-level join: {table1_upper} -> {table2_upper} on {col1}")
break
return joins
def _add_joins_to_tables(self, model_tables, tables, foreign_keys):
    """Add joins to individual tables (not as separate section).

    NOTE(review): both join-building branches below are deliberately
    disabled with ``if False`` / ``elif False`` guards (the inline comments
    say "Skip joins for now - test basic model creation first"), so this
    method currently leaves ``model_tables`` unchanged. Re-enable by
    removing the ``False and`` prefixes once basic model creation works.

    Args:
        model_tables: List of table-entry dicts for the model TML; entries
            matched by name would receive a 'joins' key.
        tables: Dict of table name -> column definition list.
        foreign_keys: Explicit FK dicts with from/to table and column keys.
    """
    # Build join relationships
    table_joins = {}
    # Skip joins for now - test basic model creation first
    if False and foreign_keys:  # disabled: explicit-FK join path
        for fk in foreign_keys:
            from_table = fk['from_table'].upper()
            to_table = fk['to_table'].upper()
            if from_table not in table_joins:
                table_joins[from_table] = []
            join_entry = {
                'with': to_table,
                'on': f"[{from_table}].[{fk['from_column'].upper()}] = [{to_table}].[{fk['to_column'].upper()}]",
                'type': 'INNER',
                'cardinality': 'MANY_TO_ONE'
            }
            table_joins[from_table].append(join_entry)
            print(f" 🔗 Adding join: {from_table} -> {to_table}")
    # Skip joins for now - test basic model creation first
    elif False and len(tables) > 1:  # disabled: heuristic shared-ID join path
        table_names = list(tables.keys())
        for i, table1 in enumerate(table_names):
            table1_upper = table1.upper()
            table1_cols = [col['name'].upper() for col in tables[table1]]
            for j, table2 in enumerate(table_names[i+1:], i+1):
                table2_upper = table2.upper()
                table2_cols = [col['name'].upper() for col in tables[table2]]
                # Look for matching ID columns
                for col1 in table1_cols:
                    if col1.endswith('ID') and col1 in table2_cols:
                        if table1_upper not in table_joins:
                            table_joins[table1_upper] = []
                        join_entry = {
                            'with': table2_upper,
                            'on': f"[{table1_upper}].[{col1}] = [{table2_upper}].[{col1}]",
                            'type': 'INNER',
                            'cardinality': 'MANY_TO_ONE'
                        }
                        table_joins[table1_upper].append(join_entry)
                        print(f" 🔗 Auto-detected join: {table1_upper} -> {table2_upper} on {col1}")
                        break
    # Apply joins to model_tables (no-op while the branches above are disabled)
    for table_entry in model_tables:
        table_name = table_entry['name']
        if table_name in table_joins:
            table_entry['joins'] = table_joins[table_name]
def _build_table_relationships(self, tables: Dict, foreign_keys: List) -> Dict:
"""Build relationships for each table based on foreign keys"""
table_relationships = {}
if foreign_keys:
for fk in foreign_keys:
from_table = fk['from_table'].upper()
to_table = fk['to_table'].upper()
from_column = fk['from_column'].upper()
to_column = fk['to_column'].upper()
# Add relationship to the from_table
if from_table not in table_relationships:
table_relationships[from_table] = []
relationship = {
'name': f"{from_table}_{to_table}_{from_column}",
'to_table': to_table,
'type': 'many_to_one', # Assuming FK relationships are many-to-one
'on': [
{
'from_column': from_column,
'to_column': to_column
}
]
}
table_relationships[from_table].append(relationship)
print(f" 🔗 Relationship: {from_table}.{from_column} -> {to_table}.{to_column}")
# Auto-detect relationships if no explicit foreign keys
elif len(tables) > 1:
table_names = list(tables.keys())
for i, table1 in enumerate(table_names):
table1_upper = table1.upper()
table1_cols = [col['name'].upper() for col in tables[table1]]
for j, table2 in enumerate(table_names[i+1:], i+1):
table2_upper = table2.upper()
table2_cols = [col['name'].upper() for col in tables[table2]]
# Look for matching ID columns
for col1 in table1_cols:
if col1.endswith('ID') and col1 in table2_cols:
if table1_upper not in table_relationships:
table_relationships[table1_upper] = []
relationship = {
'name': f"{table1_upper}_{table2_upper}_{col1}",
'to_table': table2_upper,
'type': 'many_to_one',
'on': [
{
'from_column': col1,
'to_column': col1
}
]
}
table_relationships[table1_upper].append(relationship)
print(f" 🔗 Auto-detected relationship: {table1_upper}.{col1} -> {table2_upper}.{col1}")
break
return table_relationships
def create_model_tml(self, tables: Dict, foreign_keys: List, table_guids: Dict = None,
                     model_name: str = None) -> str:
    """Generate worksheet TML (ORIGINAL APPROACH - keeping for comparison).

    Builds a legacy 'worksheet' TML document (tables + worksheet_columns)
    and returns it as a YAML string.

    NOTE(review): the join loop below reads ``fk['source_table']`` /
    ``fk['target_table']``, but every other method in this file uses
    ``from_table`` / ``to_table`` keys — if called with FKs from the same
    parser, this would raise KeyError. Confirm the expected FK shape before
    reusing this method.

    NOTE(review): ``table_entry`` (including any joins collected for it) is
    built but never appended to the worksheet — a separate minimal dict is
    appended instead — so joins never reach the output. Looks like dead
    code left from an earlier iteration.

    Args:
        tables: Dict of table name -> column definition list.
        foreign_keys: FK dicts (see key-name caveat above).
        table_guids: Optional map of upper-cased table name -> GUID, used
            as 'fqn' to disambiguate same-named tables.
        model_name: Optional worksheet name; defaults to a dated demo name.

    Returns:
        YAML string of the worksheet TML.
    """
    if not model_name:
        model_name = f"demo_worksheet_{datetime.now().strftime('%Y%m%d')}"
    worksheet = {
        'guid': None,
        'worksheet': {
            'name': model_name,
            'description': 'Auto-generated worksheet from DDL',
            'tables': [],
            'worksheet_columns': [],  # Adding back - but with GUID references
            'properties': {
                'is_bypass_rls': False,
                'join_progressive': True,
                'spotter_config': {
                    'is_spotter_enabled': True
                }
            }
        }
    }
    # Add tables with joins
    for table_name in tables.keys():
        table_entry = {'name': table_name.upper()}
        # Add FQN (GUID) if available to resolve multiple tables with same name
        if table_guids and table_name.upper() in table_guids:
            table_entry['fqn'] = table_guids[table_name.upper()]
        joins = []
        for fk in foreign_keys:
            # NOTE(review): non-standard FK key names — see docstring.
            if fk['source_table'] == table_name:
                joins.append({
                    'with': fk['target_table'].upper(),
                    'referencing_join': f"FK_{table_name.upper()}_{fk['target_table'].upper()}"
                })
        if joins:
            table_entry['joins'] = joins
        # Just populate the required 'tables' field with GUID reference
        # (table_entry above is discarded — see docstring NOTE).
        worksheet['worksheet']['tables'].append({
            'name': table_name.upper(),
            'fqn': table_guids.get(table_name.upper()) if table_guids else f"table_{table_name.lower()}"
        })
    # Add columns using table GUIDs in expressions
    for table_name, columns in tables.items():
        table_guid = table_guids.get(table_name.upper()) if table_guids else None
        for col in columns:
            col_type = 'MEASURE' if 'DECIMAL' in col['type'] else 'ATTRIBUTE'
            # Use GUID in expression if available
            if table_guid:
                expr = f"[{table_guid}].[{col['name']}]"
            else:
                expr = f"[{table_name.upper()}].[{col['name']}]"
            column_def = {
                'name': col['name'].upper(),
                'data_type': col_type,
                'expr': expr
            }
            worksheet['worksheet']['worksheet_columns'].append(column_def)
    return yaml.dump(worksheet, default_flow_style=False, sort_keys=False)
def _map_data_type(self, sql_type: str) -> str:
"""Map SQL data types to ThoughtSpot types"""
sql_type = sql_type.upper()
# DEBUG: Print what we're mapping (commented out for cleaner output)
# print(f" 🔍 Mapping data type: '{sql_type}'")
# Handle NUMBER with precision/scale intelligently
if sql_type.startswith('NUMBER'):
# Extract precision and scale from NUMBER(precision,scale)
if '(' in sql_type and ')' in sql_type:
params = sql_type[sql_type.find('(')+1:sql_type.find(')')].split(',')
if len(params) >= 2:
scale = int(params[1].strip())
result = 'INT64' if scale == 0 else 'DOUBLE'
# print(f" → NUMBER({params[0].strip()},{scale}) → {result}")
return result
else:
# print(f" → NUMBER({params[0].strip()}) → INT64")
return 'INT64' # NUMBER(x) defaults to integer
else:
# print(f" → Plain NUMBER → DOUBLE")
return 'DOUBLE' # Plain NUMBER defaults to double
type_mapping = {
'INT64': 'INT64',
'INT': 'INT64', # FIXED: INT should map to INT64
'INTEGER': 'INT64',
'BIGINT': 'INT64',
'VARCHAR': 'VARCHAR',
'TEXT': 'VARCHAR',
'STRING': 'VARCHAR',
'DATE': 'DATE',
'TIMESTAMP': 'DATE', # Try DATE for TIMESTAMP - DATE fields worked fine
'TIMESTAMP_NTZ': 'DATE', # Try DATE for TIMESTAMP_NTZ - we know DATE works
'DECIMAL': 'DOUBLE',
'FLOAT': 'DOUBLE',
'BOOLEAN': 'BOOL'
}
for sql_key, ts_type in type_mapping.items():
if sql_key in sql_type:
return ts_type
return 'VARCHAR' # Default fallback
def get_connection_by_name(self, connection_name: str) -> Dict:
    """Check if a connection with this name already exists.

    Returns the first matching metadata record, or None when nothing
    matches or the lookup fails (errors are logged and swallowed so the
    caller can fall back to creating a new connection).

    NOTE(review): this sends the nested ``metadata`` list-of-dicts as GET
    query params; ``requests`` does not serialize nested structures in
    ``params`` into anything the v2 metadata/search API can parse. Other
    calls in this file use POST with a JSON body — confirm this request
    actually returns matches rather than always falling through to None.
    """
    try:
        response = self.session.get(
            f"{self.base_url}/api/rest/2.0/metadata/search",
            params={
                "metadata": [{"type": "DATA_SOURCE", "identifier": connection_name}],
                "record_size": 10
            }
        )
        if response.status_code == 200:
            data = response.json()
            if data and len(data) > 0:
                return data[0]  # Return first matching connection
        return None
    except Exception as e:
        print(f" ⚠️ Could not check existing connections: {e}")
        return None
def create_snowflake_schema(self, database: str, schema: str):
    """Best-effort creation of the target schema via ThoughtSpot's SQL API.

    Issues ``CREATE SCHEMA IF NOT EXISTS`` through the executeQuery
    endpoint. All failures are logged and swallowed: downstream table
    operations may create the schema themselves, so this never raises.
    """
    try:
        print(f" 🏗️ Creating schema {database}.{schema}...")
        # Use ThoughtSpot's SQL execution API to create the schema.
        payload = {
            "sql_query": f"CREATE SCHEMA IF NOT EXISTS {database}.{schema}",
            # getattr mirrors the original hasattr guard for the GUID.
            "connection_guid": getattr(self, 'sf_connection_guid', None),
        }
        response = self.session.post(
            f"{self.base_url}/api/rest/2.0/database/executeQuery",
            json=payload
        )
        if response.status_code == 200:
            print(f" ✅ Schema {database}.{schema} created/verified")
        else:
            print(f" ⚠️ Schema creation response: {response.status_code} - {response.text}")
            print(f" 📝 Will proceed assuming schema exists or will be created by table operations")
    except Exception as e:
        print(f" ⚠️ Could not create schema: {e}")
        print(f" 📝 Will proceed assuming schema exists or will be created by table operations")
def ensure_tag_exists(self, tag_name: str) -> bool:
    """
    Check if a tag exists, create it if it doesn't.

    Args:
        tag_name: Name of the tag

    Returns:
        True if tag exists or was created (or no name was given),
        False on error
    """
    if not tag_name:
        # No tag name provided - skip silently
        return True
    try:
        # First, try to get the tag to see if it exists
        print(f"[ThoughtSpot] 🔍 Checking if tag '{tag_name}' exists...", flush=True)
        search_response = self.session.post(
            f"{self.base_url}/api/rest/2.0/tags/search",
            json={"tag_identifier": tag_name}
        )
        print(f"[ThoughtSpot] 🔍 Tag search response: {search_response.status_code}", flush=True)
        if search_response.status_code == 200:
            tags = search_response.json()
            print(f"[ThoughtSpot] 🔍 Tags found: {len(tags) if tags else 0}", flush=True)
            if tags and len(tags) > 0:
                # Tag exists
                tag_id = tags[0].get('id', 'unknown')
                print(f"[ThoughtSpot] ✅ Tag '{tag_name}' exists (ID: {tag_id})", flush=True)
                return True
        elif search_response.status_code == 400:
            # 400 might mean tag not found in some ThoughtSpot versions
            print(f"[ThoughtSpot] 🔍 Tag search returned 400 - tag likely doesn't exist", flush=True)
        else:
            print(f"[ThoughtSpot] ⚠️ Tag search error: {search_response.status_code}", flush=True)
            try:
                print(f"[ThoughtSpot] ⚠️ Response: {search_response.text[:200]}", flush=True)
            except Exception:
                # FIX: narrowed from bare `except:` so KeyboardInterrupt /
                # SystemExit aren't swallowed by best-effort logging.
                pass
        # Tag doesn't exist - create it
        print(f"[ThoughtSpot] 📎 Creating tag '{tag_name}'...", flush=True)
        create_response = self.session.post(
            f"{self.base_url}/api/rest/2.0/tags/create",
            json={"name": tag_name}
        )
        print(f"[ThoughtSpot] 📎 Create tag response: {create_response.status_code}", flush=True)
        if create_response.status_code in [200, 201]:
            try:
                result = create_response.json()
                tag_id = result.get('id', 'unknown')
                print(f"[ThoughtSpot] ✅ Tag '{tag_name}' created (ID: {tag_id})", flush=True)
            except Exception:
                # FIX: narrowed from bare `except:`; body parse is optional.
                print(f"[ThoughtSpot] ✅ Tag '{tag_name}' created", flush=True)
            return True
        else:
            print(f"[ThoughtSpot] ⚠️ Could not create tag: {create_response.status_code}", flush=True)
            try:
                print(f"[ThoughtSpot] ⚠️ Response: {create_response.text[:200]}", flush=True)
            except Exception:
                # FIX: narrowed from bare `except:`.
                pass
            # Return False - don't silently proceed
            return False
    except Exception as e:
        import traceback
        print(f"[ThoughtSpot] ⚠️ Tag check/create error: {str(e)}", flush=True)
        print(f"[ThoughtSpot] ⚠️ Traceback: {traceback.format_exc()}", flush=True)
        return False
def assign_tags_to_objects(self, object_guids: List[str], object_type: str, tag_name: str) -> bool:
    """
    Assign tags to ThoughtSpot objects using REST API v1.
    Auto-creates the tag if it doesn't exist.

    Args:
        object_guids: List of object GUIDs to tag
        object_type: Type of objects (LOGICAL_TABLE for tables/models, PINBOARD_ANSWER_BOOK for liveboards)
        tag_name: Tag name to assign

    Returns:
        True if successful, False otherwise
    """
    if not tag_name:
        # No tag name provided - skip silently (this is expected behavior)
        return True
    if not object_guids:
        return False
    try:
        import json as json_module
        # Make sure the tag exists before trying to assign it.
        if not self.ensure_tag_exists(tag_name):
            print(f"[ThoughtSpot] ⚠️ Could not ensure tag exists, skipping assignment", flush=True)
            return False
        # The v1 form-encoded endpoint is the one that actually works.
        form_payload = {
            'id': json_module.dumps(object_guids),
            'type': object_type,
            'tagname': json_module.dumps([tag_name])
        }
        assign_response = self.session.post(
            f"{self.base_url}/tspublic/v1/metadata/assigntag",
            data=form_payload,
            headers={
                'X-Requested-By': 'ThoughtSpot',
                'Content-Type': 'application/x-www-form-urlencoded'
            }
        )
        if assign_response.status_code in (200, 204):
            print(f"[ThoughtSpot] ✅ Tagged {len(object_guids)} {object_type} objects with '{tag_name}'", flush=True)
            return True
        print(f"[ThoughtSpot] ⚠️ Tag assignment failed: {assign_response.status_code}", flush=True)
        print(f"[ThoughtSpot] DEBUG: Response text: {assign_response.text[:500]}", flush=True)
        print(f"[ThoughtSpot] DEBUG: Object GUIDs: {object_guids}", flush=True)
        print(f"[ThoughtSpot] DEBUG: Object type: {object_type}", flush=True)
        return False
    except Exception as e:
        print(f"[ThoughtSpot] ⚠️ Tag assignment error: {str(e)}", flush=True)
        return False
def share_objects(self, object_guids: List[str], object_type: str, share_with: str) -> bool:
    """
    Share ThoughtSpot objects with a user or group (can_edit / MODIFY).

    Args:
        object_guids: GUIDs to share
        object_type: 'LOGICAL_TABLE' for models/tables, 'LIVEBOARD' for liveboards
        share_with: user email (contains '@') or group name

    Returns:
        True on success (or nothing to share), False on any failure.
    """
    if not share_with or not object_guids:
        return True  # nothing requested — treated as success
    # Emails identify users; anything else is assumed to be a group name.
    principal_type = "USER" if '@' in share_with else "USER_GROUP"
    permissions = [{
        "principal": {
            "identifier": share_with,
            "type": principal_type
        },
        "share_mode": "MODIFY"
    }]
    metadata = [{"identifier": guid, "type": object_type} for guid in object_guids]
    try:
        response = self.session.post(
            f"{self.base_url}/api/rest/2.0/security/metadata/share",
            json={"permissions": permissions, "metadata": metadata}
        )
        if response.status_code in (200, 204):
            print(f"[ThoughtSpot] ✅ Shared {len(object_guids)} {object_type} with {principal_type} '{share_with}'", flush=True)
            return True
        print(f"[ThoughtSpot] ⚠️ Share failed: {response.status_code} - {response.text[:200]}", flush=True)
        return False
    except Exception as e:
        print(f"[ThoughtSpot] ⚠️ Share error: {str(e)}", flush=True)
        return False
def _generate_demo_names(self, company_name: str = None, use_case: str = None):
"""Generate standardized demo names using DM convention"""
from datetime import datetime
import re
# Get timestamp components
now = datetime.now()
yymmdd = now.strftime('%y%m%d')
hhmmss = now.strftime('%H%M%S')
# Clean and truncate company name (5 chars)
if company_name:
company_clean = re.sub(r'[^a-zA-Z0-9]', '', company_name.upper())[:5]
else:
company_clean = 'DEMO'[:5]
# Clean and truncate use case (3 chars)
if use_case:
usecase_clean = re.sub(r'[^a-zA-Z0-9]', '', use_case.upper())[:3]
else:
usecase_clean = 'GEN'[:3]
# Generate names
base_name = f"DM{yymmdd}_{hhmmss}_{company_clean}_{usecase_clean}"
return {
'schema': base_name,
'connection': f"{base_name}_conn",
'model': f"{base_name}_model",
'base': base_name
}
def deploy_all(self, ddl: str, database: str, schema: str, base_name: str,
connection_name: str = None, company_name: str = None,
use_case: str = None, liveboard_name: str = None,
llm_model: str = None, tag_name: str = None,
liveboard_method: str = None, share_with: str = None,
company_research: str = None,
progress_callback=None) -> Dict:
"""
Deploy complete data model to ThoughtSpot
Args:
ddl: Data Definition Language statements
database: Target database name
schema: Target schema name
connection_name: Optional connection name (auto-generated if not provided)
Returns:
Dict with deployment results and names of created objects
"""
results = {
'success': False,
'connection': None,
'tables': [],
'model': None,
'errors': []
}
table_guids = {} # Store table GUIDs for model creation
def log_progress(message):
"""Helper to log progress both to console and callback"""
# ALWAYS print to console FIRST
import sys
print(f"[ThoughtSpot] {message}", flush=True)
sys.stdout.flush() # Force flush
# Then call callback if provided
if progress_callback:
try:
progress_callback(message)
except Exception as e:
print(f"[Warning] Callback error: {e}", flush=True)
try:
import time
start_time = time.time()
# STEP 0: Authenticate first!
log_progress("Authenticating...")
if not self.authenticate():
raise Exception("ThoughtSpot authentication failed")
auth_time = time.time() - start_time
log_progress(f"[OK] Auth complete ({auth_time:.1f}s)")
# Parse DDL
tables, foreign_keys = self.parse_ddl(ddl)
if not tables:
raise Exception("No tables found in DDL")
# Validate foreign key references before deployment (uses explicit FKs from DDL)
fk_warnings = self.validate_foreign_key_references(tables, foreign_keys)
if fk_warnings:
log_progress(f"[WARN] {len(fk_warnings)} FK warning(s) - joins to missing tables will be skipped")
for warning in fk_warnings:
log_progress(f" {warning}")
# Step 1: Create connection using base name
# base_name is like "DEMO_AMA_12111207_X4R"
# schema is like "DEMO_
# 2111207_X4R_sch"
demo_names = {
'schema': schema,
'connection': f"{base_name}_conn",
'model': f"{base_name}_mdl",
'base': base_name
}
if not connection_name:
connection_name = demo_names['connection']
log_progress(f"Creating connection: {connection_name}...")
# Check if connection already exists first
existing_connection = self.get_connection_by_name(connection_name)
if existing_connection:
connection_guid = existing_connection['header']['id_guid']
connection_fqn = connection_guid
results['connection'] = connection_name
results['connection_guid'] = connection_guid
log_progress(f"[OK] Connection ready")
# Assign tag to existing connection
if tag_name and connection_guid:
log_progress(f"Assigning tag '{tag_name}' to connection...")
self.assign_tags_to_objects([connection_guid], 'DATA_SOURCE', tag_name)
else:
log_progress(f"Creating new connection: {connection_name}")
# base_name already has random suffix (e.g., _UZM) so no need for additional uniqueness
print(f"🔗 Creating connection: {connection_name}")
print(f" Account: '{self.sf_account}' (length: {len(self.sf_account)})")
print(f" User: '{self.sf_user}'")
print(f" Database: '{database}'")
connection_tml_yaml = self.create_connection_tml(connection_name)
# Filter out sensitive info for display - use regex for private key
import re
display_tml = re.sub(r'-----BEGIN ENCRYPTED PRIVATE KEY-----.*?-----END ENCRYPTED PRIVATE KEY-----', '[PRIVATE_KEY_REDACTED]', connection_tml_yaml, flags=re.DOTALL)
passphrase = get_admin_setting('SNOWFLAKE_KP_PASSPHRASE', required=False)
if passphrase:
display_tml = display_tml.replace(passphrase, "[PASSPHRASE_REDACTED]")
print(f"\n📄 TML being sent:\n{display_tml}")
# connection_tml_yaml is already a YAML string from create_connection_tml()
response = self.session.post(
f"{self.base_url}/api/rest/2.0/metadata/tml/import",
json={
"metadata_tmls": [connection_tml_yaml],
"import_policy": "PARTIAL"
}
)
print(f" Response status: {response.status_code}")
if response.status_code != 200:
# Print the actual error response from ThoughtSpot
try:
error_response = response.json()
print(f"❌ Error response: {error_response}")
except:
print(f"❌ Error response (raw): {response.text}")
if response.status_code == 200:
result = response.json()
print(f"📋 Connection response: {result}")
print(f"📋 Response type: {type(result)}")
# Handle both dict and list responses
if isinstance(result, list):
# Response is a list
if len(result) > 0 and result[0].get('response', {}).get('status', {}).get('status_code') == 'OK':
connection_guid = result[0].get('response', {}).get('header', {}).get('id_guid')
print(f"✅ Connection created: {connection_name} (GUID: {connection_guid})")
results['connection'] = connection_name
results['connection_guid'] = connection_guid
# Store connection GUID for table creation
connection_fqn = connection_guid
else:
error_msg = result[0].get('response', {}).get('status', {}).get('error_message', 'Unknown error') if result else 'Empty response'
raise Exception(f"Connection creation failed: {error_msg}")
elif isinstance(result, dict) and result.get('object') and len(result['object']) > 0:
obj = result['object'][0]
if obj.get('status', {}).get('status_code') == 'OK':
connection_guid = obj.get('header', {}).get('id_guid')
print(f"✅ Connection created: {connection_name} (GUID: {connection_guid})")
results['connection'] = connection_name
results['connection_guid'] = connection_guid
# Store connection GUID for table creation
connection_fqn = connection_guid
else:
error_msg = obj.get('status', {}).get('error_message', 'Unknown error')
raise Exception(f"Connection creation failed: {error_msg}")
else:
raise Exception("Connection creation failed: No object in response")
else:
raise Exception(f"Connection creation failed: HTTP {response.status_code}")
# Assign tag to connection
if tag_name and connection_guid:
log_progress(f"Assigning tag '{tag_name}' to connection...")
self.assign_tags_to_objects([connection_guid], 'DATA_SOURCE', tag_name)
# Step 1.5: Schema should already exist (created by demo_prep tool)
print("\n1️⃣.5 Using existing schema in Snowflake...")
# Step 2: Build relationships for tables
print("\n1️⃣.5 Building relationships...")
table_relationships = self._build_table_relationships(tables, foreign_keys)
# Step 2: TWO-PHASE TABLE CREATION (to avoid dependency order issues)
table_count = len(tables)
batch1_start = time.time()
log_progress(f"Batch 1/2: Creating {table_count} tables...")
# PHASE 1: Create all tables WITHOUT joins in ONE batch API call
# Build array of all table TMLs
table_tmls_batch1 = []
table_names_order = [] # Track order for matching response
for table_name, columns in tables.items():
print(f"[ThoughtSpot] Preparing {table_name.upper()}...", flush=True)
table_tml = self.create_table_tml(table_name, columns, connection_name, database, schema, all_tables=None, foreign_keys=foreign_keys)
table_tmls_batch1.append(table_tml)
table_names_order.append(table_name.upper())
# Send all tables in ONE API call
log_progress(f" Sending batch request for {len(table_tmls_batch1)} tables...")
response = self.session.post(
f"{self.base_url}/api/rest/2.0/metadata/tml/import",
json={
"metadata_tmls": table_tmls_batch1,
"import_policy": "PARTIAL",
"create_new": True
}
)
if response.status_code == 200:
result = response.json()
# Handle both response formats (list or dict with 'object' key)
if isinstance(result, list):
objects = result
elif isinstance(result, dict) and 'object' in result:
objects = result['object']
else:
error = f"Batch 1 failed: Unexpected response format: {type(result)}"
log_progress(f" ❌ {error}")
results['errors'].append(error)
return results
# Process each table result
for idx, obj in enumerate(objects):
table_name = table_names_order[idx] if idx < len(table_names_order) else f"TABLE_{idx}"
if obj.get('response', {}).get('status', {}).get('status_code') == 'OK':
table_guid = obj.get('response', {}).get('header', {}).get('id_guid')
print(f"[ThoughtSpot] ✅ {table_name} created", flush=True)
results['tables'].append(table_name)
table_guids[table_name] = table_guid
else:
error_msg = obj.get('response', {}).get('status', {}).get('error_message', 'Unknown error')
error = f"Table {table_name} failed: {error_msg}"
print(f"[ThoughtSpot] ❌ {table_name} failed: {error_msg}", flush=True)
results['errors'].append(error)
else:
error = f"Batch 1 HTTP error: {response.status_code} - {response.text}"
log_progress(f" ❌ {error}")
results['errors'].append(error)
return results
# Check if we created any tables successfully
if not table_guids:
log_progress(" ❌ No tables were created successfully in Batch 1")
return results
# Assign tags to tables
table_guid_list = list(table_guids.values())
print(f"🔍 DEBUG BEFORE TAG CALL: tag_name='{tag_name}', table_guid_list={table_guid_list}")
log_progress(f"Assigning tag '{tag_name}' to {len(table_guid_list)} tables...")
self.assign_tags_to_objects(table_guid_list, 'LOGICAL_TABLE', tag_name)
batch1_time = time.time() - batch1_start
log_progress(f"[OK] Batch 1 complete: {len(table_guids)} tables created ({batch1_time:.1f}s)")
# PHASE 2: Update tables WITH joins in ONE batch API call
batch2_start = time.time()
log_progress(f"Batch 2/2: Adding joins to {len(table_guids)} tables...")
# Build array of all table update TMLs (with joins)
table_tmls_batch2 = []
table_names_order_batch2 = []
for table_name, columns in tables.items():
table_name_upper = table_name.upper()
# Only add joins if the table was created successfully in Phase 1
if table_name_upper not in table_guids:
print(f"[ThoughtSpot] Skipping {table_name_upper} (not created)", flush=True)
continue
# Get the GUID for this table
table_guid = table_guids[table_name_upper]
print(f"[ThoughtSpot] Preparing joins for {table_name_upper}...", flush=True)
# Create table TML WITH joins_with section AND the table GUID
table_tml = self.create_table_tml(
table_name, columns, connection_name, database, schema,
all_tables=tables, table_guid=table_guid, foreign_keys=foreign_keys
)
table_tmls_batch2.append(table_tml)
table_names_order_batch2.append(table_name_upper)
# Send all table updates in ONE API call
if table_tmls_batch2:
log_progress(f" Sending batch request to add joins to {len(table_tmls_batch2)} tables...")
response = self.session.post(
f"{self.base_url}/api/rest/2.0/metadata/tml/import",
json={
"metadata_tmls": table_tmls_batch2,
"import_policy": "PARTIAL",
"create_new": False # Update existing tables
}
)
if response.status_code == 200:
result = response.json()
# Handle both response formats
if isinstance(result, list):
objects = result
elif isinstance(result, dict) and 'object' in result:
objects = result['object']
else:
objects = []
# Process each result
for idx, obj in enumerate(objects):
table_name = table_names_order_batch2[idx] if idx < len(table_names_order_batch2) else f"TABLE_{idx}"
if obj.get('response', {}).get('status', {}).get('status_code') == 'OK':
print(f"[ThoughtSpot] ✅ {table_name} joins added", flush=True)
else:
error_msg = obj.get('response', {}).get('status', {}).get('error_message', 'Unknown error')
print(f"[ThoughtSpot] ⚠️ {table_name} joins failed: {error_msg}", flush=True)
results['errors'].append(f"Joins for {table_name} failed: {error_msg}")
else:
log_progress(f" ⚠️ Batch 2 HTTP error: {response.status_code}")
batch2_time = time.time() - batch2_start
log_progress(f"[OK] Batch 2 complete: Joins added ({batch2_time:.1f}s)")
actual_constraint_ids = {} # We'll generate these for the model
# Skip separate relationship creation for now
# print("\n2️⃣.5 Creating relationships separately...")
# self.create_relationships_separately(table_relationships, table_guids)
# Step 3: Extract constraint IDs from created tables
table_constraints = {}
for table_name, table_guid in table_guids.items():
print(f"[ThoughtSpot] Extracting joins from {table_name}...", flush=True)
# Export table TML to get constraint IDs
export_response = self.session.post(
f"{self.base_url}/api/rest/2.0/metadata/tml/export",
json={
"metadata": [{"identifier": table_guid, "type": "LOGICAL_TABLE"}],
"export_associated": False,
"format_type": "YAML"
}
)
if export_response.status_code == 200:
tml_data = export_response.json()
if tml_data and 'edoc' in tml_data[0]:
import json
tml_json = json.loads(tml_data[0]['edoc'])
# Extract joins_with constraint IDs
joins_with = tml_json.get('table', {}).get('joins_with', [])
if joins_with:
table_constraints[table_name] = []
for join in joins_with:
constraint_id = join.get('name')
destination = join.get('destination', {}).get('name')
if constraint_id and destination:
table_constraints[table_name].append({
'constraint_id': constraint_id,
'destination': destination
})
# Step 4: Create model (semantic layer) with constraint references
model_start = time.time()
model_name = demo_names['model']
log_progress(f"Creating model: {model_name}...")
# Use the enhanced model creation that includes constraint references
model_tml = self._create_model_with_constraints(tables, foreign_keys, table_guids, table_constraints, model_name, connection_name)
print(f"\n📄 Model TML being sent:\n{model_tml}")
response = self.session.post(
f"{self.base_url}/api/rest/2.0/metadata/tml/import",
json={
"metadata_tmls": [model_tml],
"import_policy": "ALL_OR_NONE",
"create_new": True
}
)
if response.status_code == 200:
result = response.json()
# Handle both response formats (list or dict with 'object' key)
if isinstance(result, list):
objects = result
elif isinstance(result, dict) and 'object' in result:
objects = result['object']
else:
error = f"Model failed: Unexpected response format: {type(result)}"
log_progress(f" ❌ {error}")
results['errors'].append(error)
objects = []
if objects and len(objects) > 0:
if objects[0].get('response', {}).get('status', {}).get('status_code') == 'OK':
model_guid = objects[0].get('response', {}).get('header', {}).get('id_guid')
model_time = time.time() - model_start
log_progress(f"[OK] Model created ({model_time:.1f}s)")
results['model'] = model_name
results['model_guid'] = model_guid
# Assign tag to model
print(f"🔍 DEBUG BEFORE TAG CALL: tag_name='{tag_name}', model_guid='{model_guid}'")
log_progress(f"Assigning tag '{tag_name}' to model...")
self.assign_tags_to_objects([model_guid], 'LOGICAL_TABLE', tag_name)
# Share model
_effective_share = share_with or get_admin_setting('SHARE_WITH', required=False)
if _effective_share:
log_progress(f"Sharing model with '{_effective_share}'...")
self.share_objects([model_guid], 'LOGICAL_TABLE', _effective_share)
# Step 3.5: Enable Spotter + enrich model semantics in a single export→update→reimport
# (create_new=True import ignores spotter_config, so we always re-import here)
try:
export_resp = self.session.post(
f"{self.base_url}/api/rest/2.0/metadata/tml/export",
json={
"metadata": [{"identifier": model_guid, "type": "LOGICAL_TABLE"}],
"export_associated": False,
"format_type": "YAML"
}
)
if export_resp.status_code == 200:
export_data = export_resp.json()
if export_data and 'edoc' in export_data[0]:
model_tml_dict = json.loads(export_data[0]['edoc'])
# Enable Spotter
model_tml_dict.setdefault('model', {}).setdefault('properties', {})['spotter_config'] = {'is_spotter_enabled': True}
# Enrich with description, synonyms, and AI context
if company_research:
try:
from model_semantic_updater import ModelSemanticUpdater
log_progress("Generating model description, synonyms, and AI context...")
sem_start = time.time()
updater = ModelSemanticUpdater(self, llm_model=llm_model)
model_description = updater.generate_model_description(
company_research=company_research,
use_case=use_case or '',
company_name=company_name or '',
model_name=model_name,
)
column_semantics = updater.generate_column_semantics(
company_research=company_research,
model_tml=model_tml_dict,
use_case=use_case or '',
company_name=company_name or '',
)
# Apply to TML dict in-place (returns YAML string)
enriched_yaml = updater.apply_to_model_tml(
model_tml_dict, column_semantics, model_description
)
# Parse back so we can still dump consistently below
model_tml_dict = yaml.safe_load(enriched_yaml)
sem_time = time.time() - sem_start
log_progress(f"[OK] Semantics generated: {len(column_semantics)} columns enriched ({sem_time:.1f}s)")
except Exception as sem_err:
log_progress(f"[WARN] Semantic enrichment failed (non-fatal): {sem_err}")
updated_tml = yaml.dump(model_tml_dict, allow_unicode=True, sort_keys=False)
update_resp = self.session.post(
f"{self.base_url}/api/rest/2.0/metadata/tml/import",
json={
"metadata_tmls": [updated_tml],
"import_policy": "ALL_OR_NONE",
"create_new": False
}
)
if update_resp.status_code == 200:
log_progress("🤖 Spotter enabled + model semantics applied")
else:
log_progress(f"🤖 Model update failed: HTTP {update_resp.status_code} — {update_resp.text[:200]}")
else:
log_progress("🤖 Spotter enable: export returned no edoc")
else:
log_progress(f"🤖 Spotter enable: export failed HTTP {export_resp.status_code}")
except Exception as spotter_error:
log_progress(f"🤖 Spotter/semantics exception: {spotter_error}")
# Step 4: Auto-create Liveboard from model
lb_start = time.time()
# HYBRID is the only supported liveboard creation method
method = 'HYBRID'
log_progress(f"Creating liveboard ({method} method)...")
try:
# Build company data from parameters
# Clean company name for display (strip .com, .org, etc)
clean_company = company_name.split('.')[0].title() if company_name and '.' in company_name else (company_name or 'Demo Company')
company_data = {
'name': clean_company,
'use_case': use_case or 'General Analytics'
}
if method == 'HYBRID':
# HYBRID: MCP creates liveboard, TML post-processes
from liveboard_creator import create_liveboard_from_model_mcp, create_liveboard_from_model, enhance_mcp_liveboard
# Get actual column names from ThoughtSpot model (not DDL)
# This is critical because TS may rename columns to make them unique
# e.g., PROCESSING_FEE becomes gift_processing_fee and tran_processing_fee
model_columns = self.get_model_columns(model_guid)
if not model_columns:
log_progress(f" ⚠️ Could not get model columns, falling back to DDL")
model_columns = []
for table_name, columns_list in tables.items():
for col in columns_list:
model_columns.append(col)
# Get liveboard questions from the vertical×function config
outlier_dicts = []
try:
from demo_personas import parse_use_case, get_use_case_config
uc_vertical, uc_function = parse_use_case(use_case or '')
uc_config = get_use_case_config(uc_vertical or "Generic", uc_function or "Generic")
lq = uc_config.get("liveboard_questions", [])
required_qs = [q for q in lq if q.get("required")]
optional_qs = [q for q in lq if not q.get("required")]
for q in required_qs:
outlier_dicts.append({
'title': q['title'],
'insight': q.get('insight', ''),
'viz_type': q['viz_type'],
'show_me_query': q['viz_question'],
'kpi_companion': True,
'spotter_questions': q.get('spotter_qs', []),
})
for q in optional_qs[:2]:
outlier_dicts.append({
'title': q['title'],
'insight': q.get('insight', ''),
'viz_type': q['viz_type'],
'show_me_query': q['viz_question'],
'kpi_companion': False,
'spotter_questions': q.get('spotter_qs', []),
})
if outlier_dicts:
log_progress(f" [MCP] Using {len(outlier_dicts)} liveboard questions from {uc_vertical}×{uc_function}")
except Exception as outlier_err:
log_progress(f" [MCP] Liveboard questions loading skipped: {outlier_err}")
# MCP creates liveboard
if method == 'HYBRID':
log_progress(f" Step 1/2: MCP creating initial liveboard...")
log_progress(f" [MCP] Model: {model_name}, GUID: {model_guid}")
log_progress(f" [MCP] Use case: {use_case or 'General Analytics'}")
log_progress(f" [MCP] Using {len(model_columns)} columns from ThoughtSpot model")
try:
liveboard_result = create_liveboard_from_model_mcp(
ts_client=self,
model_id=model_guid,
model_name=model_name,
company_data=company_data,
use_case=use_case or 'General Analytics',
num_visualizations=10,
liveboard_name=liveboard_name,
outliers=outlier_dicts if outlier_dicts else None,
llm_model=llm_model,
model_columns=model_columns,
prompt_logger=self.prompt_logger
)
except Exception as mcp_error:
import traceback
error_trace = traceback.format_exc()
log_progress(f" [MCP ERROR] {type(mcp_error).__name__}: {str(mcp_error)}")
liveboard_result = {'success': False, 'error': str(mcp_error), 'traceback': error_trace}
# Log result
if liveboard_result.get('success'):
log_progress(f" [MCP] Liveboard created: {liveboard_result.get('liveboard_guid')}")
else:
log_progress(f" [MCP FAILED] {liveboard_result.get('error', 'Unknown error')}")
log_progress(" [FALLBACK] Trying direct TML liveboard creation...")
try:
liveboard_result = create_liveboard_from_model(
ts_client=self,
model_id=model_guid,
model_name=model_name,
company_data=company_data,
use_case=use_case or 'General Analytics',
num_visualizations=10,
liveboard_name=liveboard_name,
llm_model=llm_model,
outliers=outlier_dicts if outlier_dicts else None,
model_columns=model_columns,
prompt_logger=self.prompt_logger
)
if liveboard_result.get('success'):
log_progress(f" [FALLBACK OK] Liveboard created: {liveboard_result.get('liveboard_guid')}")
else:
log_progress(f" [FALLBACK FAILED] {liveboard_result.get('error', 'Unknown error')}")
except Exception as fallback_error:
import traceback
fallback_trace = traceback.format_exc()
log_progress(f" [FALLBACK ERROR] {type(fallback_error).__name__}: {str(fallback_error)}")
liveboard_result = {
'success': False,
'error': f"MCP failed and fallback failed: {fallback_error}",
'traceback': fallback_trace
}
# HYBRID: Add TML enhancement if MCP succeeded
if method == 'HYBRID' and liveboard_result.get('success') and liveboard_result.get('liveboard_guid'):
log_progress(f" Step 2/2: Enhancing with TML post-processing...")
enhance_result = enhance_mcp_liveboard(
liveboard_guid=liveboard_result['liveboard_guid'],
company_data=company_data,
ts_client=self,
add_groups=True,
fix_kpis=True,
apply_brand_colors=True
)
if enhance_result.get('success'):
log_progress(f" [OK] Enhancement applied")
else:
enhance_err = f"TML enhancement failed: {enhance_result.get('message', 'unknown')[:100]}"
log_progress(f" [ERROR] {enhance_err}")
results['errors'].append(enhance_err)
# Check result
print(f"🔍 DEBUG: Liveboard result received: {liveboard_result}")
print(f"🔍 DEBUG: Success flag: {liveboard_result.get('success')}")
if liveboard_result.get('success'):
lb_time = time.time() - lb_start
log_progress(f"[OK] Liveboard created via {method} ({lb_time:.1f}s)")
results['liveboard'] = liveboard_result.get('liveboard_name')
results['liveboard_guid'] = liveboard_result.get('liveboard_guid')
results['liveboard_method'] = method
if liveboard_result.get('liveboard_url'):
results['liveboard_url'] = liveboard_result.get('liveboard_url')
# Assign tag to liveboard
if tag_name and liveboard_result.get('liveboard_guid'):
log_progress(f"Assigning tag '{tag_name}' to liveboard...")
self.assign_tags_to_objects([liveboard_result['liveboard_guid']], 'PINBOARD_ANSWER_BOOK', tag_name)
# Share liveboard
_effective_share = share_with or get_admin_setting('SHARE_WITH', required=False)
if _effective_share and liveboard_result.get('liveboard_guid'):
log_progress(f"Sharing liveboard with '{_effective_share}'...")
self.share_objects([liveboard_result['liveboard_guid']], 'LIVEBOARD', _effective_share)
else:
error = f"Liveboard creation failed: {liveboard_result.get('error', 'Unknown error')}"
print(f"❌ DEBUG: Liveboard creation failed! Error: {error}")
results['errors'].append(error)
log_progress(f"[ERROR] {error}")
except Exception as lb_error:
error = f"Liveboard creation exception: {str(lb_error)}"
results['errors'].append(error)
log_progress(f"[ERROR] {error}")
else:
# Extract detailed error information
obj_response = objects[0].get('response', {})
status = obj_response.get('status', {})
error_message = status.get('error_message', 'Unknown error')
# Clean HTML tags from error message (ThoughtSpot sometimes returns HTML)
error_message = re.sub(r'<[^>]+>', '', error_message).strip()
if not error_message:
error_message = 'Schema validation failed (no details provided)'
error_code = status.get('error_code', 'N/A')
# Try to extract additional error details from various response fields
error_details = []
# Check for detailed error messages in different response structures
if 'error_details' in status:
error_details.append(f"Error details: {status.get('error_details')}")
if 'validation_errors' in obj_response:
error_details.append(f"Validation errors: {obj_response.get('validation_errors')}")
if 'warnings' in obj_response:
error_details.append(f"Warnings: {obj_response.get('warnings')}")
# Check header for additional info
header = obj_response.get('header', {})
if 'error' in header:
error_details.append(f"Header error: {header.get('error')}")
# Get any additional error details
full_response = json.dumps(objects[0], indent=2)
# Save the TML that failed for debugging
import tempfile
# os is already imported at module level
try:
debug_dir = os.path.join(tempfile.gettempdir(), 'thoughtspot_debug')
os.makedirs(debug_dir, exist_ok=True)
failed_tml_path = os.path.join(debug_dir, f'failed_model_{datetime.now().strftime("%Y%m%d_%H%M%S")}.tml')
with open(failed_tml_path, 'w') as f:
f.write(model_tml)
log_progress(f"💾 Failed TML saved to: {failed_tml_path}")
print(f"💾 Failed TML saved to: {failed_tml_path}")
except Exception as save_error:
log_progress(f"[WARN] Could not save failed TML: {save_error}")
# Build comprehensive error message
error = f"Model validation failed: {error_message}"
if error_code != 'N/A':
error += f" (Error code: {error_code})"
if error_details:
error += f"\n\nAdditional details:\n" + "\n".join(error_details)
print(f"📋 Full model response: {full_response}") # DEBUG: Show full response
print(f" ❌ {error}")
log_progress(f" ❌ {error}")
log_progress(f" 📋 Full response details:")
log_progress(f"{full_response}")
# Log full TML for debugging
log_progress(f"\n📄 TML that was sent:\n{model_tml}")
results['errors'].append(error)
results['errors'].append(f"Full API response: {full_response}")
results['errors'].append(f"Failed TML saved to: {failed_tml_path if 'failed_tml_path' in locals() else 'N/A'}")
else:
error = "Model failed: No objects in response"
log_progress(f" ❌ {error}")
results['errors'].append(error)
# Mark as successful if we got this far
results['success'] = len(results['errors']) == 0
except Exception as e:
import traceback
error_msg = str(e)
full_trace = traceback.format_exc()
# Log to console with full details
print(f"\n{'='*60}")
print(f"❌ DEPLOYMENT EXCEPTION")
print(f"{'='*60}")
print(f"Error: {error_msg}")
print(f"\nFull traceback:")
print(full_trace)
print(f"{'='*60}\n")
# Log through callback too
log_progress(f"[ERROR] Deployment failed: {error_msg}")
log_progress(f"Traceback: {full_trace}")
results['errors'].append(error_msg)
results['errors'].append(f"Traceback: {full_trace}")
return results
def deploy_to_thoughtspot(ddl: str, database: str, schema: str,
                          connection_name: Optional[str] = None, company_name: Optional[str] = None,
                          use_case: Optional[str] = None, progress_callback=None) -> Dict:
    """
    Convenience function for deploying to ThoughtSpot.

    Creates a ThoughtSpotDeployer and runs the full deployment pipeline
    (connection, tables, model, liveboard) in a single call.

    Args:
        ddl: Data Definition Language statements to parse and deploy
        database: Target database name
        schema: Target schema name
        connection_name: Optional ThoughtSpot connection name
        company_name: Optional company name (used for naming/branding downstream)
        use_case: Optional use-case string (drives liveboard question selection)
        progress_callback: Optional callable invoked with progress updates

    Returns:
        Dict with deployment results (includes 'success' flag and 'errors' list)
    """
    deployer = ThoughtSpotDeployer()
    return deployer.deploy_all(ddl, database, schema, connection_name,
                               company_name, use_case, progress_callback)
if __name__ == "__main__":
    # Demo entry point: deploy a minimal single-table model end to end.
    sample_ddl = """
CREATE TABLE CUSTOMERS (
CUSTOMERID INT64 PRIMARY KEY,
NAME VARCHAR(255)
);
"""
    # Run against a schema known to exist in the target Snowflake account.
    deployment_results = deploy_to_thoughtspot(
        ddl=sample_ddl,
        database="DEMOBUILD",  # Use the actual Snowflake database
        schema="THOUGHTSPO_SALESA_20250915_193303"  # Use the working schema from your working table
    )
    # Pretty-print the deployment outcome.
    banner = "=" * 60
    print("\n" + banner)
    print("📊 DEPLOYMENT RESULTS:")
    print(banner)
    print(json.dumps(deployment_results, indent=2))