Spaces:

APPONTE
/

agent-seara

Sleeping

File size: 40,565 Bytes

e982206

"""
Nó para geração de gráficos
"""
import io
import logging
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import matplotlib.dates as mdates
from PIL import Image
from typing import Dict, Any, Optional

from utils.object_manager import get_object_manager

async def graph_generation_node(state: Dict[str, Any]) -> Dict[str, Any]:
    """
    Agent node that renders a chart for the selected graph type.

    Reads ``graph_type``, ``graph_error``, ``graph_data`` (for its
    ``data_id`` entry) and ``user_input`` from ``state``. The object stored
    under ``data_id`` is fetched from the object manager, rendered through
    ``generate_graph`` and the resulting image is stored back in the object
    manager.

    Args:
        state: Current agent state. It is updated in place.

    Returns:
        The same state dict. On success ``graph_image_id`` is set,
        ``graph_generated`` is True and ``graph_error`` is None. On failure
        ``graph_error`` holds the message and ``graph_generated`` is False.
        When no graph type is selected, or a previous ``graph_error`` is
        present, the state is returned untouched.
    """
    def _fail(message: str) -> Dict[str, Any]:
        """Log ``message`` and record it in the state as a graph failure."""
        logging.error(f"[GRAPH_GENERATION] {message}")
        state.update({
            "graph_error": message,
            "graph_generated": False
        })
        return state

    try:
        logging.info("[GRAPH_GENERATION] Iniciando geração de gráfico")

        # Nothing to do when no graph type was selected upstream
        graph_type = state.get("graph_type")
        if not graph_type:
            logging.info("[GRAPH_GENERATION] Nenhum tipo de gráfico selecionado, pulando geração")
            return state

        # Do not try to render on top of an earlier failure
        if state.get("graph_error"):
            logging.info("[GRAPH_GENERATION] Erro anterior detectado, pulando geração")
            return state

        # ``or {}`` also covers a key that is present but explicitly None,
        # which would otherwise fail with an opaque AttributeError
        graph_data = state.get("graph_data") or {}
        data_id = graph_data.get("data_id")
        if not data_id:
            return _fail("ID dos dados do gráfico não encontrado")

        # Fetch the data to plot from the object manager
        obj_manager = get_object_manager()
        df = obj_manager.get_object(data_id)
        if df is None or df.empty:
            return _fail("Dados do gráfico não encontrados ou vazios")

        # Build the chart title from the user question (truncated at 50 chars);
        # a None question is treated as empty instead of raising on len()
        user_query = state.get("user_input") or ""
        title = f"Visualização: {user_query[:50]}..." if len(user_query) > 50 else f"Visualização: {user_query}"

        graph_image = await generate_graph(df, graph_type, title, user_query)
        if graph_image is None:
            return _fail(f"Falha ao gerar gráfico do tipo {graph_type}")

        # Keep the rendered image in the object manager; the state only holds its id
        graph_image_id = obj_manager.store_object(graph_image, "graph_image")

        state.update({
            "graph_image_id": graph_image_id,
            "graph_generated": True,
            "graph_error": None
        })

        logging.info(f"[GRAPH_GENERATION] Gráfico gerado com sucesso: {graph_type}")

    except Exception as e:
        # Node boundary: never let a rendering problem break the agent flow,
        # but keep the traceback in the log for diagnosis
        error_msg = f"Erro na geração de gráfico: {e}"
        logging.exception(f"[GRAPH_GENERATION] {error_msg}")
        state.update({
            "graph_error": error_msg,
            "graph_generated": False
        })

    return state

async def generate_graph(df: pd.DataFrame, graph_type: str, title: str = None, user_query: str = None) -> Optional[Image.Image]:
    """
    Render a chart of the requested type from a DataFrame.

    The data is first reshaped by ``prepare_data_for_graph_unified`` and then
    handed to the generator that matches ``graph_type``. Unknown types fall
    back to vertical bars.

    Args:
        df: DataFrame holding the data to plot.
        graph_type: Identifier of the chart type to produce.
        title: Chart title.
        user_query: Original user question, forwarded to data preparation.

    Returns:
        The rendered chart, or None when the input or prepared data is empty
        or when any step raises.
    """
    logging.info(f"[GRAPH_GENERATION] Gerando gráfico tipo {graph_type}. DataFrame: {len(df)} linhas")

    if df.empty:
        logging.warning("[GRAPH_GENERATION] DataFrame vazio")
        return None

    try:
        # Reshape the data through the unified preparation step
        chart_df = prepare_data_for_graph_unified(df, graph_type, user_query)
        if chart_df.empty:
            logging.warning("[GRAPH_GENERATION] DataFrame preparado está vazio")
            return None

        # Global plotting defaults shared by every generator
        plt.style.use('default')
        palette = plt.cm.tab10.colors

        # Chart type -> generator coroutine
        renderers = {
            'line_simple': generate_line_simple,
            'multiline': generate_multiline,
            'area': generate_area,
            'bar_vertical': generate_bar_vertical,
            'bar_horizontal': generate_bar_horizontal,
            'bar_grouped': generate_bar_grouped,
            'bar_stacked': generate_bar_stacked,
            'pie': generate_pie,
            'donut': generate_donut,
            'pie_multiple': generate_pie_multiple,
        }

        renderer = renderers.get(graph_type)
        if renderer is None:
            logging.warning(f"[GRAPH_GENERATION] Tipo '{graph_type}' não reconhecido, usando bar_vertical")
            renderer = generate_bar_vertical

        return await renderer(chart_df, title, palette)

    except Exception as e:
        logging.error(f"[GRAPH_GENERATION] Erro ao gerar gráfico: {e}")
        return None

def analyze_dataframe_structure(df: pd.DataFrame) -> Dict[str, Any]:
    """
    Classify the columns of a DataFrame as numeric, date or categorical.

    Classification rules, applied per column:
      * numeric dtype -> numeric;
      * ``object`` dtype where more than 80% of the values parse as numbers
        (a comma is accepted as decimal separator) -> numeric;
      * ``object`` dtype whose column name contains a date hint and whose
        first three values parse as datetimes -> date;
      * datetime64 dtype -> date;
      * anything else -> categorical.

    Args:
        df: DataFrame to inspect.

    Returns:
        Dict with the keys ``numeric_cols``, ``date_cols``,
        ``categorical_cols`` (lists of column labels), ``total_cols`` and the
        boolean flags ``has_multiple_numerics``, ``has_multiple_categoricals``
        and ``is_suitable_for_grouping``. An empty DataFrame yields empty
        lists, ``total_cols`` 0 and all flags False.
    """
    if df.empty:
        return {
            'numeric_cols': [],
            'date_cols': [],
            'categorical_cols': [],
            'total_cols': 0,
            'has_multiple_numerics': False,
            'has_multiple_categoricals': False,
            'is_suitable_for_grouping': False
        }

    # Substrings of a column name that suggest it holds dates
    date_name_hints = ('data', 'date', 'time', 'dia', 'mes', 'ano')

    numeric_cols = []
    date_cols = []
    categorical_cols = []

    for col in df.columns:
        col_data = df[col]

        if pd.api.types.is_numeric_dtype(col_data):
            numeric_cols.append(col)
        elif col_data.dtype == 'object':
            # Strings may still represent numbers (possibly with a decimal comma)
            try:
                test_numeric = pd.to_numeric(col_data.astype(str).str.replace(',', '.'), errors='coerce')
                if test_numeric.notna().sum() > len(col_data) * 0.8:  # more than 80% valid numbers
                    numeric_cols.append(col)
                # str() keeps non-string column labels (ints, tuples) from raising here
                elif any(hint in str(col).lower() for hint in date_name_hints):
                    try:
                        # Probe only the first rows; a full parse is not needed to decide
                        pd.to_datetime(col_data.head(3), errors='raise')
                        date_cols.append(col)
                    except Exception:
                        categorical_cols.append(col)
                else:
                    categorical_cols.append(col)
            except Exception:
                # Best effort: anything that cannot be probed is treated as categorical.
                # ``Exception`` (not a bare except) so KeyboardInterrupt/SystemExit propagate.
                categorical_cols.append(col)
        elif pd.api.types.is_datetime64_any_dtype(col_data):
            date_cols.append(col)
        else:
            categorical_cols.append(col)

    return {
        'numeric_cols': numeric_cols,
        'date_cols': date_cols,
        'categorical_cols': categorical_cols,
        'total_cols': len(df.columns),
        'has_multiple_numerics': len(numeric_cols) >= 2,
        'has_multiple_categoricals': len(categorical_cols) >= 2,
        'is_suitable_for_grouping': len(categorical_cols) >= 2 or (len(categorical_cols) >= 1 and len(numeric_cols) >= 2)
    }

def prepare_data_for_graph_unified(df: pd.DataFrame, graph_type: str, user_query: str = None) -> pd.DataFrame:
    """
    Single entry point for reshaping data before plotting.

    Works on a copy of ``df``, classifies its columns with
    ``analyze_dataframe_structure`` and delegates to the preparation helper
    that matches the chart family.

    Args:
        df: Original DataFrame.
        graph_type: Chart type identifier.
        user_query: User question (accepted for interface compatibility;
            not used by this function).

    Returns:
        DataFrame trimmed/ordered for the requested chart type. An empty
        input is returned as-is.
    """
    logging.info(f"[GRAPH_GENERATION] 🔧 Preparação UNIFICADA para {graph_type}")

    if df.empty:
        logging.warning("[GRAPH_GENERATION] DataFrame vazio")
        return df

    # Never touch the caller's frame
    working_df = df.copy()

    # Column classification drives every branch below
    layout = analyze_dataframe_structure(working_df)
    nums = layout['numeric_cols']
    dates = layout['date_cols']
    cats = layout['categorical_cols']

    logging.info(f"[GRAPH_GENERATION] 📊 Estrutura: {len(nums)} numéricas, {len(dates)} datas, {len(cats)} categóricas")

    # One preparation helper per chart family
    if graph_type in ('line_simple', 'area'):
        return _prepare_for_temporal_graphs(working_df, dates, nums, cats)

    if graph_type in ('bar_vertical', 'bar_horizontal'):
        return _prepare_for_simple_bar_graphs(working_df, cats, nums, graph_type)

    if graph_type in ('bar_grouped', 'bar_stacked'):
        return _prepare_for_grouped_graphs(working_df, layout, graph_type)

    if graph_type in ('pie', 'donut', 'pie_multiple'):
        return _prepare_for_pie_graphs(working_df, cats, nums, graph_type)

    if graph_type == 'multiline':
        return _prepare_for_multiline_graphs(working_df, layout)

    logging.warning(f"[GRAPH_GENERATION] Tipo {graph_type} não reconhecido, usando preparação básica")
    return _prepare_basic_fallback(working_df, cats, nums)

def _prepare_for_temporal_graphs(df: pd.DataFrame, date_cols: list, numeric_cols: list, categorical_cols: list) -> pd.DataFrame:
    """
    Reduce the data to an (x, y) pair for line and area charts.

    Prefers the first date column as X (rows sorted by date); otherwise uses
    the first categorical column as X (rows sorted by the value). Y is always
    the first numeric column. When no usable pair exists the input is
    returned unchanged.
    """
    if not numeric_cols or not (date_cols or categorical_cols):
        logging.warning("[GRAPH_GENERATION] Dados insuficientes para gráfico temporal")
        return df

    value_col = numeric_cols[0]

    if date_cols:
        # Date axis: chronological order
        axis_col = date_cols[0]
        ordered = df[[axis_col, value_col]].sort_values(by=axis_col)
        logging.info(f"[GRAPH_GENERATION] 📅 Temporal: {axis_col} (data) + {value_col} (numérica)")
        return ordered

    # Categorical axis: order by the plotted value
    axis_col = categorical_cols[0]
    ordered = df[[axis_col, value_col]].sort_values(by=value_col)
    logging.info(f"[GRAPH_GENERATION] 📊 Categórico: {axis_col} + {value_col}")
    return ordered

def _prepare_for_simple_bar_graphs(df: pd.DataFrame, categorical_cols: list, numeric_cols: list, graph_type: str) -> pd.DataFrame:
    """
    Reduce the data to (category, value) for simple bar charts.

    Keeps the first categorical and the first numeric column, sorted by value
    in descending order. Vertical bars are capped at the 15 largest rows.
    When either column kind is missing the input is returned unchanged.
    """
    if not (categorical_cols and numeric_cols):
        logging.warning("[GRAPH_GENERATION] Dados insuficientes para gráfico de barras")
        return df

    label_col = categorical_cols[0]
    value_col = numeric_cols[0]
    ranked = df[[label_col, value_col]].sort_values(by=value_col, ascending=False)

    # Only vertical bars are capped
    too_many = graph_type == 'bar_vertical' and len(ranked) > 15
    if too_many:
        ranked = ranked.head(15)
        logging.info(f"[GRAPH_GENERATION] 📊 Limitado a 15 categorias para {graph_type}")

    logging.info(f"[GRAPH_GENERATION] 📊 Barras simples: {label_col} + {value_col}")
    return ranked

def _prepare_for_grouped_graphs(df: pd.DataFrame, structure: dict, graph_type: str) -> pd.DataFrame:
    """
    Select the columns needed for grouped / stacked bar charts.

    Scenarios, decided from ``structure`` (as produced by
    ``analyze_dataframe_structure``):
      1. several numeric columns: one label column + every numeric column.
         The label is the first categorical column or, when there is none,
         the first date column;
      2. one numeric + several categorical columns: all of them (the second
         categorical is used for colour grouping downstream);
      3. one numeric + one categorical column: both columns;
      4. anything else: the input is returned unchanged.

    Args:
        df: DataFrame to trim.
        structure: Column classification dict.
        graph_type: Chart type identifier (not used for the decision).

    Returns:
        DataFrame restricted to the selected columns, or ``df`` itself when
        the structure does not fit any grouped layout.
    """
    numeric_cols = structure['numeric_cols']
    categorical_cols = structure['categorical_cols']
    has_multiple_numerics = structure['has_multiple_numerics']
    has_multiple_categoricals = structure['has_multiple_categoricals']

    logging.info(f"[GRAPH_GENERATION] 🎯 Preparando agrupado: {len(numeric_cols)} num, {len(categorical_cols)} cat")

    if has_multiple_numerics:
        # SCENARIO 1: several numerics. A label column is required; indexing
        # categorical_cols[0] blindly raised IndexError for frames such as
        # "date + metrics", so fall back to the first date column.
        label_cols = categorical_cols or structure.get('date_cols') or []
        if not label_cols:
            logging.warning("[GRAPH_GENERATION] ❌ Dados inadequados para gráfico agrupado")
            return df

        cols_to_keep = [label_cols[0]] + numeric_cols
        result_df = df[cols_to_keep]
        logging.info(f"[GRAPH_GENERATION] ✅ Múltiplas numéricas: {cols_to_keep}")
        return result_df

    elif len(numeric_cols) == 1 and has_multiple_categoricals:
        # SCENARIO 2: one numeric + several categoricals -> colour grouping,
        # keep every categorical plus the numeric column
        cols_to_keep = categorical_cols + numeric_cols
        result_df = df[cols_to_keep]
        logging.info(f"[GRAPH_GENERATION] ✅ Agrupamento por cor: {cols_to_keep}")
        return result_df

    elif len(numeric_cols) == 1 and len(categorical_cols) == 1:
        # SCENARIO 3: one numeric + one categorical -> effectively a simple chart
        cols_to_keep = categorical_cols + numeric_cols
        result_df = df[cols_to_keep]
        logging.info(f"[GRAPH_GENERATION] ⚠️ Dados simples para agrupado: {cols_to_keep}")
        return result_df

    else:
        # SCENARIO 4: nothing usable
        logging.warning("[GRAPH_GENERATION] ❌ Dados inadequados para gráfico agrupado")
        return df

def _prepare_for_pie_graphs(df: pd.DataFrame, categorical_cols: list, numeric_cols: list, graph_type: str) -> pd.DataFrame:
    """
    Shape the data for pie, donut and multi-pie charts.

    For ``pie_multiple`` with at least two categorical columns the first two
    categoricals and the first numeric column are kept as they are. Otherwise
    values are summed per category, sorted in descending order and, when more
    than 10 categories remain, reduced to the top 9 plus an ``Outros`` row
    (added only if the remainder sums to more than zero). When either column
    kind is missing the input is returned unchanged.
    """
    if not (categorical_cols and numeric_cols):
        logging.warning("[GRAPH_GENERATION] Dados insuficientes para gráfico de pizza")
        return df

    label_col = categorical_cols[0]
    amount_col = numeric_cols[0]

    wants_multiple = graph_type == 'pie_multiple' and len(categorical_cols) >= 2
    if wants_multiple:
        # Multi-pie keeps the raw rows: two categoricals + the value
        slices = df[[categorical_cols[0], categorical_cols[1], amount_col]]
        logging.info(f"[GRAPH_GENERATION] 🥧 Pizzas múltiplas: {slices.columns.tolist()}")
        return slices

    # Single pie / donut: one slice per category, largest first
    totals = df.groupby(label_col)[amount_col].sum().reset_index()
    totals = totals.sort_values(by=amount_col, ascending=False)

    if len(totals) > 10:
        leading = totals.head(9)
        remainder = totals.iloc[9:][amount_col].sum()
        if remainder > 0:
            tail_row = pd.DataFrame({label_col: ['Outros'], amount_col: [remainder]})
            totals = pd.concat([leading, tail_row], ignore_index=True)
        else:
            totals = leading

    logging.info(f"[GRAPH_GENERATION] 🥧 Pizza: {label_col} + {amount_col} ({len(totals)} categorias)")
    return totals

def _prepare_for_multiline_graphs(df: pd.DataFrame, structure: dict) -> pd.DataFrame:
    """
    Select the columns for a multi-line chart.

    Requires at least two numeric columns. The X axis is the first date
    column (rows sorted by it) or, failing that, the first categorical
    column (row order kept). Otherwise the input is returned unchanged.
    """
    dates = structure['date_cols']
    metrics = structure['numeric_cols']
    labels = structure['categorical_cols']

    enough_metrics = len(metrics) >= 2

    if dates and enough_metrics:
        # Date axis + every numeric series, in chronological order
        selected = [dates[0]] + metrics
        chart_df = df[selected].sort_values(by=dates[0])
        logging.info(f"[GRAPH_GENERATION] 📈 Multilinhas temporais: {selected}")
        return chart_df

    if labels and enough_metrics:
        # Categorical axis + every numeric series
        selected = [labels[0]] + metrics
        chart_df = df[selected]
        logging.info(f"[GRAPH_GENERATION] 📈 Multilinhas categóricas: {selected}")
        return chart_df

    logging.warning("[GRAPH_GENERATION] Dados insuficientes para multilinhas")
    return df

def _prepare_basic_fallback(df: pd.DataFrame, categorical_cols: list, numeric_cols: list) -> pd.DataFrame:
    """
    Fallback preparation for unrecognised chart types.

    Keeps the first categorical and the first numeric column; when either
    kind is missing the input is returned unchanged.
    """
    if not (categorical_cols and numeric_cols):
        logging.warning("[GRAPH_GENERATION] Dados inadequados para qualquer gráfico")
        return df

    pair = df[[categorical_cols[0], numeric_cols[0]]]
    logging.info(f"[GRAPH_GENERATION] 🔄 Fallback básico: {pair.columns.tolist()}")
    return pair

def save_plot_to_image() -> Image.Image:
    """
    Render the current matplotlib figure to a PIL image and close the figure.

    The figure is written as PNG (100 dpi, tight bounding box, white
    background) into an in-memory buffer that backs the returned image.

    Returns:
        PIL image of the current figure.

    Raises:
        Whatever ``plt.savefig`` or ``Image.open`` raises; the current figure
        is closed in either case.
    """
    buf = io.BytesIO()
    try:
        plt.savefig(buf, format='png', dpi=100, bbox_inches='tight', facecolor='white')
    finally:
        # Always release the figure, even when rendering fails; otherwise the
        # figure stays registered in pyplot and leaks memory
        plt.close()
    buf.seek(0)
    return Image.open(buf)

# ==================== FUNÇÕES DE GERAÇÃO ESPECÍFICAS ====================

async def generate_line_simple(df: pd.DataFrame, title: str, colors) -> Optional[Image.Image]:
    """
    Draw a single-series line chart.

    The first column is the X axis and the second column the Y values. A
    datetime X column is plotted on a date axis formatted as dd/mm/YYYY; any
    other X column is plotted by position with its values as tick labels.

    Returns:
        The rendered image, or None when ``df`` has fewer than two columns.
    """
    if len(df.columns) < 2:
        return None

    x_name, y_name = df.columns[0], df.columns[1]
    temporal = pd.api.types.is_datetime64_any_dtype(df[x_name])

    fig, ax = plt.subplots(figsize=(12, 6))
    line_style = dict(marker='o', linewidth=2, color=colors[0])

    if temporal:
        ax.plot(df[x_name], df[y_name], **line_style)
        fig.autofmt_xdate()
        ax.xaxis.set_major_formatter(mdates.DateFormatter('%d/%m/%Y'))
    else:
        # Non-date X: plot by row position and label ticks with the values
        positions = range(len(df))
        ax.plot(positions, df[y_name], **line_style)
        ax.set_xticks(positions)
        ax.set_xticklabels(df[x_name], rotation=45, ha='right')

    ax.set_xlabel(x_name)
    ax.set_ylabel(y_name)
    ax.set_title(title or f"{y_name} por {x_name}")
    ax.grid(True, linestyle='--', alpha=0.7)
    fig.tight_layout()

    return save_plot_to_image()

async def generate_multiline(df: pd.DataFrame, title: str, colors) -> Optional[Image.Image]:
    """
    Draw one line per numeric column against a shared X axis.

    The first column is the X axis; every numeric column after it becomes a
    series. When no numeric series is found the call is delegated to
    ``generate_line_simple``.

    Returns:
        The rendered image, or None when ``df`` has fewer than two columns.
    """
    if len(df.columns) < 2:
        return None

    axis_col = df.columns[0]
    series_cols = [name for name in df.columns[1:] if pd.api.types.is_numeric_dtype(df[name])]

    if not series_cols:
        return await generate_line_simple(df, title, colors)

    temporal = pd.api.types.is_datetime64_any_dtype(df[axis_col])
    # Dates are plotted as-is; anything else is plotted by row position
    positions = df[axis_col] if temporal else range(len(df))

    fig, ax = plt.subplots(figsize=(12, 6))

    for idx, name in enumerate(series_cols):
        ax.plot(positions, df[name], marker='o', linewidth=2,
                label=name, color=colors[idx % len(colors)])

    if temporal:
        fig.autofmt_xdate()
        ax.xaxis.set_major_formatter(mdates.DateFormatter('%d/%m/%Y'))
    else:
        ax.set_xticks(positions)
        ax.set_xticklabels(df[axis_col], rotation=45, ha='right')

    ax.set_xlabel(axis_col)
    ax.set_ylabel("Valores")
    ax.set_title(title or f"Comparação por {axis_col}")
    ax.legend(title="Séries", loc='best')
    ax.grid(True, linestyle='--', alpha=0.7)
    fig.tight_layout()

    return save_plot_to_image()

async def generate_area(df: pd.DataFrame, title: str, colors) -> Optional[Image.Image]:
    """
    Draw a filled area chart.

    The first column is the X axis and the second column the Y values. The
    area is filled at 50% opacity and outlined with a solid line. A datetime
    X column uses a date axis formatted as dd/mm/YYYY; any other X column is
    plotted by position with its values as tick labels.

    Returns:
        The rendered image, or None when ``df`` has fewer than two columns.
    """
    if len(df.columns) < 2:
        return None

    x_name, y_name = df.columns[0], df.columns[1]
    temporal = pd.api.types.is_datetime64_any_dtype(df[x_name])

    fig, ax = plt.subplots(figsize=(12, 6))
    fill_color = colors[0]

    if temporal:
        ax.fill_between(df[x_name], df[y_name], alpha=0.5, color=fill_color)
        ax.plot(df[x_name], df[y_name], color=fill_color, linewidth=2)
        fig.autofmt_xdate()
        ax.xaxis.set_major_formatter(mdates.DateFormatter('%d/%m/%Y'))
    else:
        # Non-date X: plot by row position and label ticks with the values
        positions = range(len(df))
        ax.fill_between(positions, df[y_name], alpha=0.5, color=fill_color)
        ax.plot(positions, df[y_name], color=fill_color, linewidth=2)
        ax.set_xticks(positions)
        ax.set_xticklabels(df[x_name], rotation=45, ha='right')

    ax.set_xlabel(x_name)
    ax.set_ylabel(y_name)
    ax.set_title(title or f"{y_name} por {x_name}")
    ax.grid(True, linestyle='--', alpha=0.7)
    fig.tight_layout()

    return save_plot_to_image()

async def generate_bar_vertical(df: pd.DataFrame, title: str, colors) -> Optional[Image.Image]:
    """
    Draw a vertical bar chart with a value label above each bar.

    The first column provides the category labels and the second column the
    bar heights. String values are converted to numbers (a comma is accepted
    as decimal separator) and rows without a valid number are dropped.

    Args:
        df: DataFrame with at least two columns (label, value).
        title: Chart title; defaults to "<value> por <label>" when empty.
        colors: Colour sequence; only the first entry is used.

    Returns:
        The rendered image, or None when ``df`` has fewer than two columns,
        no numeric value survives the conversion, or the conversion fails.
    """
    if len(df.columns) < 2:
        return None

    x_col, y_col = df.columns[0], df.columns[1]

    # Work on a copy so the numeric conversion never touches the caller's frame
    df_plot = df.copy()
    try:
        if df_plot[y_col].dtype == 'object':
            # Strings -> numbers, treating a comma as the decimal separator
            df_plot[y_col] = pd.to_numeric(df_plot[y_col].astype(str).str.replace(',', '.'), errors='coerce')

        # Drop rows whose value is not a number
        df_plot = df_plot.dropna(subset=[y_col])

        if df_plot.empty:
            logging.error(f"[GRAPH_GENERATION] Nenhum valor numérico válido encontrado na coluna {y_col}")
            return None

    except Exception as e:
        logging.error(f"[GRAPH_GENERATION] Erro ao converter dados para numérico: {e}")
        return None

    plt.figure(figsize=(12, 8))
    bars = plt.bar(range(len(df_plot)), df_plot[y_col], color=colors[0])

    # Value labels are cosmetic: a failure here must not lose the chart
    try:
        max_value = df_plot[y_col].max()
        for bar in bars:
            height = bar.get_height()
            # pd.notna instead of isinstance(height, (int, float)): heights
            # may be NumPy integer scalars, which are not ``int`` instances,
            # and those bars would otherwise silently get no label
            if pd.notna(height):
                plt.text(bar.get_x() + bar.get_width()/2., height + 0.02 * max_value,
                        f'{height:,.0f}', ha='center', fontsize=9)
    except Exception as e:
        logging.warning(f"[GRAPH_GENERATION] Erro ao adicionar valores nas barras: {e}")

    plt.xlabel(x_col)
    plt.ylabel(y_col)
    plt.title(title or f"{y_col} por {x_col}")
    plt.xticks(range(len(df_plot)), df_plot[x_col], rotation=45, ha='right')
    plt.grid(True, linestyle='--', alpha=0.7, axis='y')
    plt.tight_layout()

    return save_plot_to_image()

async def generate_bar_horizontal(df: pd.DataFrame, title: str, colors) -> Optional[Image.Image]:
    """
    Draw a horizontal bar chart with a value label at the end of each bar.

    The first column provides the category labels and the second column the
    bar lengths. String values are converted to numbers (a comma is accepted
    as decimal separator) and rows without a valid number are dropped. The
    figure height grows with the number of bars.

    Args:
        df: DataFrame with at least two columns (label, value).
        title: Chart title; defaults to "<value> por <label>" when empty.
        colors: Colour sequence; only the first entry is used.

    Returns:
        The rendered image, or None when ``df`` has fewer than two columns,
        no numeric value survives the conversion, or the conversion fails.
    """
    if len(df.columns) < 2:
        return None

    x_col, y_col = df.columns[0], df.columns[1]

    # Work on a copy so the numeric conversion never touches the caller's frame
    df_plot = df.copy()
    try:
        if df_plot[y_col].dtype == 'object':
            # Strings -> numbers, treating a comma as the decimal separator
            df_plot[y_col] = pd.to_numeric(df_plot[y_col].astype(str).str.replace(',', '.'), errors='coerce')

        # Drop rows whose value is not a number
        df_plot = df_plot.dropna(subset=[y_col])

        if df_plot.empty:
            logging.error(f"[GRAPH_GENERATION] Nenhum valor numérico válido encontrado na coluna {y_col}")
            return None

    except Exception as e:
        logging.error(f"[GRAPH_GENERATION] Erro ao converter dados para numérico: {e}")
        return None

    plt.figure(figsize=(12, max(6, len(df_plot) * 0.4)))
    bars = plt.barh(range(len(df_plot)), df_plot[y_col], color=colors[0])

    # Value labels are cosmetic: a failure here must not lose the chart
    try:
        max_value = df_plot[y_col].max()
        for bar in bars:
            width = bar.get_width()
            # pd.notna instead of isinstance(width, (int, float)): widths may
            # be NumPy integer scalars, which are not ``int`` instances, and
            # those bars would otherwise silently get no label
            if pd.notna(width):
                plt.text(width + 0.02 * max_value, bar.get_y() + bar.get_height()/2.,
                        f'{width:,.0f}', va='center', fontsize=9)
    except Exception as e:
        logging.warning(f"[GRAPH_GENERATION] Erro ao adicionar valores nas barras: {e}")

    # Axes are swapped relative to the vertical chart: values on X, labels on Y
    plt.xlabel(y_col)
    plt.ylabel(x_col)
    plt.title(title or f"{y_col} por {x_col}")
    plt.yticks(range(len(df_plot)), df_plot[x_col])
    plt.grid(True, linestyle='--', alpha=0.7, axis='x')
    plt.tight_layout()

    return save_plot_to_image()

async def generate_bar_grouped(df: pd.DataFrame, title: str, colors) -> Optional[Image.Image]:
    """
    Draw a grouped bar chart, choosing the layout from the data structure.

    Layouts, decided from ``analyze_dataframe_structure(df)``:
      1. two or more numeric columns: one bar per metric for each X value;
      2. one numeric + two or more categorical columns: bars grouped by
         colour using the second categorical column;
      3. anything else (including no numeric column): plain vertical bars.

    Args:
        df: Prepared DataFrame.
        title: Chart title.
        colors: Colour sequence used for the series.

    Returns:
        The rendered image, or None when ``df`` has fewer than two columns
        or the delegated generator returns None.
    """
    logging.info(f"[GRAPH_GENERATION] 🎯 Gerando barras agrupadas REFATORADO. Colunas: {df.columns.tolist()}")

    if len(df.columns) < 2:
        logging.warning("[GRAPH_GENERATION] ❌ Dados insuficientes para gráfico agrupado")
        return None

    # Column classification drives the layout decision
    structure = analyze_dataframe_structure(df)
    numeric_cols = structure['numeric_cols']
    categorical_cols = structure['categorical_cols']

    logging.info(f"[GRAPH_GENERATION] 📊 Estrutura: {len(numeric_cols)} numéricas, {len(categorical_cols)} categóricas")

    if not numeric_cols:
        logging.warning("[GRAPH_GENERATION] ❌ Nenhuma coluna numérica encontrada")
        return await generate_bar_vertical(df, title, colors)

    if len(numeric_cols) >= 2:
        # SCENARIO 1: several numerics -> traditional grouped chart
        if categorical_cols:
            x_col, y_cols = categorical_cols[0], numeric_cols
        else:
            # No categorical column (e.g. a date axis, or an all-numeric
            # frame): indexing categorical_cols[0] raised IndexError. Use the
            # first non-numeric column as X, else the first column, and plot
            # the remaining numeric columns.
            x_col = next((col for col in df.columns if col not in numeric_cols), df.columns[0])
            y_cols = [col for col in numeric_cols if col != x_col]
        return await _generate_multi_numeric_grouped(df, title, colors, x_col, y_cols)

    elif len(numeric_cols) == 1 and len(categorical_cols) >= 2:
        # SCENARIO 2: one numeric + several categoricals -> colour grouping
        return await _generate_color_grouped_bars(df, title, colors, categorical_cols, numeric_cols[0])

    elif len(numeric_cols) == 1 and len(categorical_cols) == 1:
        # SCENARIO 3: simple data -> plain vertical bars
        logging.info("[GRAPH_GENERATION] ⚠️ Dados simples, usando barras verticais")
        return await generate_bar_vertical(df, title, colors)

    else:
        # SCENARIO 4: structure does not fit a grouped layout
        logging.warning("[GRAPH_GENERATION] ❌ Estrutura de dados inadequada para agrupamento")
        return await generate_bar_vertical(df, title, colors)

async def _generate_multi_numeric_grouped(df: pd.DataFrame, title: str, colors, x_col: str, y_cols: list) -> Optional[Image.Image]:
    """
    Draw a grouped bar chart with one bar per numeric column for each X value.

    String-typed metric columns are converted to numbers (a comma is accepted
    as decimal separator) and rows with any missing metric are dropped. When
    the value ranges of the metrics differ by more than a factor of 100 the
    chart is delegated to ``_generate_dual_axis_chart``.

    Args:
        df: DataFrame holding ``x_col`` and every column in ``y_cols``.
            It is not modified.
        title: Chart title.
        colors: Colour sequence, cycled over the metrics.
        x_col: Column used for the X axis labels.
        y_cols: Numeric columns to plot.

    Returns:
        The rendered image, or None when no row has all metrics available.
    """
    logging.info(f"[GRAPH_GENERATION] 📊 Múltiplas numéricas: {x_col} + {y_cols}")

    # Convert on a private copy: assigning into ``df`` would alter the
    # caller's DataFrame (and trigger chained-assignment warnings on slices)
    df = df.copy()
    for col in y_cols:
        if df[col].dtype == 'object':
            df[col] = pd.to_numeric(df[col].astype(str).str.replace(',', '.'), errors='coerce')

    # Drop rows where any metric is missing
    df_clean = df.dropna(subset=y_cols)

    if df_clean.empty:
        logging.error("[GRAPH_GENERATION] ❌ Todos os valores são NaN após conversão")
        return None

    # Compare the spread of each metric to detect very different scales
    col_ranges = {col: df_clean[col].max() - df_clean[col].min() for col in y_cols}
    max_range = max(col_ranges.values())
    min_range = min(col_ranges.values())

    if max_range > 0 and min_range > 0 and (max_range / min_range) > 100:
        # Very different scales -> dual Y axes.
        # NOTE(review): only the first two metrics are passed on; any further
        # metric is not drawn in this mode.
        logging.info("[GRAPH_GENERATION] 📊 Escalas diferentes, usando eixos duplos")
        return await _generate_dual_axis_chart(df_clean, title, colors, x_col, y_cols[0], y_cols[1])

    # Regular grouped chart: the metrics share a 0.8-wide slot per X value
    x_pos = np.arange(len(df_clean))
    width = 0.8 / len(y_cols)

    fig, ax = plt.subplots(figsize=(14, 8))

    for i, col in enumerate(y_cols):
        # Centre the group of bars on the tick position
        offset = width * i - width * (len(y_cols) - 1) / 2
        bars = ax.bar(x_pos + offset, df_clean[col], width, label=col,
                     color=colors[i % len(colors)], alpha=0.8)

        # Value labels, for positive bars only
        for bar in bars:
            height = bar.get_height()
            if height > 0:
                ax.text(bar.get_x() + bar.get_width()/2., height + height * 0.02,
                       f'{height:.0f}', ha='center', fontsize=8)

    ax.set_xlabel(x_col)
    ax.set_ylabel('Valores')
    ax.set_title(title or f"Comparação de {', '.join(y_cols)} por {x_col}")
    ax.set_xticks(x_pos)
    ax.set_xticklabels(df_clean[x_col], rotation=45, ha='right')
    ax.legend()
    ax.grid(True, linestyle='--', alpha=0.7, axis='y')
    plt.tight_layout()

    logging.info(f"[GRAPH_GENERATION] ✅ Gráfico agrupado tradicional criado: {len(y_cols)} métricas")
    return save_plot_to_image()

async def _generate_color_grouped_bars(df: pd.DataFrame, title: str, colors, categorical_cols: list, y_col: str) -> Optional[Image.Image]:
    """
    Draw bars grouped by colour from two categorical columns and one metric.

    The first categorical column defines the X positions and the second one
    defines the colour groups. For each (X value, group) pair the first
    matching row provides the bar height; missing pairs are drawn as 0.
    With a single categorical column the call is delegated to
    ``generate_bar_vertical``.

    Args:
        df: DataFrame holding the categorical columns and ``y_col``.
            It is not modified.
        title: Chart title.
        colors: Colour sequence, cycled over the groups.
        categorical_cols: Categorical columns; the first is X, the second the group.
        y_col: Numeric column to plot.

    Returns:
        The rendered image, or None when no row has a valid ``y_col`` value.
    """
    x_col = categorical_cols[0]
    group_col = categorical_cols[1] if len(categorical_cols) > 1 else None

    logging.info(f"[GRAPH_GENERATION] 🎨 Agrupamento por cor: {x_col} (X) + {y_col} (Y) + {group_col} (cor)")

    if not group_col:
        logging.warning("[GRAPH_GENERATION] ⚠️ Sem coluna para agrupamento, usando gráfico simples")
        return await generate_bar_vertical(df[[x_col, y_col]], title, colors)

    # Convert on a private copy: assigning into ``df`` would alter the
    # caller's DataFrame (and trigger chained-assignment warnings on slices)
    if df[y_col].dtype == 'object':
        df = df.copy()
        df[y_col] = pd.to_numeric(df[y_col].astype(str).str.replace(',', '.'), errors='coerce')

    # Drop rows without a valid value
    df_clean = df.dropna(subset=[y_col])

    if df_clean.empty:
        logging.error("[GRAPH_GENERATION] ❌ Todos os valores são NaN após conversão")
        return None

    # Distinct groups (colours) and X categories, in order of appearance
    unique_groups = df_clean[group_col].unique()
    unique_x = df_clean[x_col].unique()

    logging.info(f"[GRAPH_GENERATION] 🎯 Grupos: {unique_groups} | X: {len(unique_x)} categorias")

    # The groups share a 0.8-wide slot per X category
    x_pos = np.arange(len(unique_x))
    width = 0.8 / len(unique_groups)

    fig, ax = plt.subplots(figsize=(14, 8))

    for i, group in enumerate(unique_groups):
        group_data = df_clean[df_clean[group_col] == group]

        # One value per X position; 0 where the group has no row for it
        values = []
        for x_val in unique_x:
            matching_rows = group_data[group_data[x_col] == x_val]
            if not matching_rows.empty:
                values.append(matching_rows[y_col].iloc[0])
            else:
                values.append(0)

        # Centre the group of bars on the tick position
        offset = width * i - width * (len(unique_groups) - 1) / 2
        bars = ax.bar(x_pos + offset, values, width, label=f"{group_col}: {group}",
                     color=colors[i % len(colors)], alpha=0.8)

        # Value labels, for positive bars only
        for bar, value in zip(bars, values):
            if value > 0:
                ax.text(bar.get_x() + bar.get_width()/2., value + value * 0.02,
                       f'{value:.0f}', ha='center', fontsize=8)

    ax.set_xlabel(x_col)
    ax.set_ylabel(y_col)
    ax.set_title(title or f"{y_col} por {x_col} (agrupado por {group_col})")
    ax.set_xticks(x_pos)
    ax.set_xticklabels(unique_x, rotation=45, ha='right')
    # Legend outside the plot area so it never covers the bars
    ax.legend(bbox_to_anchor=(1.05, 1), loc='upper left')
    ax.grid(True, linestyle='--', alpha=0.7, axis='y')
    plt.tight_layout()

    logging.info(f"[GRAPH_GENERATION] ✅ Gráfico agrupado por cor criado: {len(unique_groups)} grupos")
    return save_plot_to_image()

async def _generate_dual_axis_chart(df: pd.DataFrame, title: str, colors, x_col: str, y1_col: str, y2_col: str) -> Optional[Image.Image]:
    """
    Draw two bar series side by side, each measured against its own Y axis.

    ``y1_col`` is plotted against the left axis and ``y2_col`` against a
    twinned right axis, so metrics with different scales remain readable.

    Args:
        df: Data to plot; one pair of bars is drawn per row.
        title: Chart title; when falsy a default is built from the column names.
        colors: Indexable palette; entry 0 styles the left series and entry 1
            the right series.
        x_col: Column supplying the X tick labels.
        y1_col: Column plotted on the left axis.
        y2_col: Column plotted on the right axis.

    Returns:
        The result of ``save_plot_to_image()`` for the figure built here.
    """
    logging.info(f"[GRAPH_GENERATION] 📊 Eixos duplos: {y1_col} (esq) + {y2_col} (dir)")

    fig, ax1 = plt.subplots(figsize=(14, 8))

    bar_width = 0.35
    positions = np.arange(len(df))
    half_width = bar_width / 2

    # Left-hand series and axis styling
    left_color = colors[0]
    bars1 = ax1.bar(
        positions - half_width,
        df[y1_col],
        bar_width,
        label=y1_col,
        color=left_color,
        alpha=0.8,
    )
    ax1.set_xlabel(x_col)
    ax1.set_ylabel(y1_col, color=left_color)
    ax1.tick_params(axis='y', labelcolor=left_color)

    # Right-hand series lives on a twin axis sharing the same X positions
    ax2 = ax1.twinx()
    right_color = colors[1]
    bars2 = ax2.bar(
        positions + half_width,
        df[y2_col],
        bar_width,
        label=y2_col,
        color=right_color,
        alpha=0.8,
    )
    ax2.set_ylabel(y2_col, color=right_color)
    ax2.tick_params(axis='y', labelcolor=right_color)

    # Shared X ticks and horizontal grid are attached to the left axis
    ax1.set_xticks(positions)
    ax1.set_xticklabels(df[x_col], rotation=45, ha='right')
    ax1.grid(True, linestyle='--', alpha=0.7, axis='y')

    # Write the value slightly above every strictly positive bar; the
    # comparison is kept as "> 0" so NaN heights are skipped as well.
    for axis, series_bars in ((ax1, bars1), (ax2, bars2)):
        for rect in series_bars:
            bar_height = rect.get_height()
            if bar_height > 0:
                axis.text(
                    rect.get_x() + rect.get_width()/2.,
                    bar_height + bar_height * 0.02,
                    f'{bar_height:.0f}',
                    ha='center',
                    fontsize=8,
                )

    plt.title(title or f"{y1_col} e {y2_col} por {x_col}")
    plt.tight_layout()

    logging.info(f"[GRAPH_GENERATION] ✅ Gráfico com eixos duplos criado: {y1_col} + {y2_col}")
    return save_plot_to_image()

# Função removida - substituída pela nova lógica unificada

# Função removida - substituída pela nova lógica unificada em _generate_color_grouped_bars()

async def generate_bar_stacked(df: pd.DataFrame, title: str, colors) -> Optional[Image.Image]:
    """
    Generate a stacked bar chart.

    The first column supplies the X categories; every remaining column with a
    numeric dtype becomes one layer of the stack. Falls back to
    ``generate_bar_vertical`` when the frame has fewer than three columns or
    when none of the remaining columns is numeric.

    Args:
        df: Data to plot, one stacked bar per row.
        title: Chart title; when falsy a default based on the X column is used.
        colors: Palette, cycled when there are more layers than colors.

    Returns:
        The result of ``save_plot_to_image()`` (or of the fallback chart).
    """
    if len(df.columns) < 3:
        return await generate_bar_vertical(df, title, colors)

    x_col = df.columns[0]
    y_cols = [col for col in df.columns[1:] if pd.api.types.is_numeric_dtype(df[col])]

    if not y_cols:
        return await generate_bar_vertical(df, title, colors)

    fig, ax = plt.subplots(figsize=(12, 8))
    x_pos = np.arange(len(df))
    # Running top of the stack for each X position
    bottom = np.zeros(len(df))

    for i, col in enumerate(y_cols):
        bars = ax.bar(x_pos, df[col], bottom=bottom, label=col, color=colors[i % len(colors)])

        # Label each positive segment at its vertical centre.
        # Bar heights come back as NumPy scalars; numpy.int64 is not a
        # subclass of int, so an isinstance(int, float) gate would skip every
        # label of an integer column. A plain comparison handles all numeric
        # scalars and is False for NaN.
        for j, bar in enumerate(bars):
            height = bar.get_height()
            if height > 0:
                ax.text(bar.get_x() + bar.get_width()/2., bottom[j] + height/2,
                        f'{height:.2f}', ha='center', va='center', fontsize=8, color='white')

        # Missing values contribute nothing to the stack height
        bottom += df[col].fillna(0).to_numpy(dtype=float)

    ax.set_xlabel(x_col)
    ax.set_ylabel('Valores')
    ax.set_title(title or f"Distribuição por {x_col}")
    ax.set_xticks(x_pos)
    ax.set_xticklabels(df[x_col], rotation=45, ha='right')
    ax.legend()
    plt.tight_layout()

    return save_plot_to_image()

async def generate_pie(df: pd.DataFrame, title: str, colors) -> Optional[Image.Image]:
    """
    Generate a pie chart from the first two columns of ``df``.

    The first column supplies the slice labels and the second the slice
    values. Non-numeric values are converted to numbers, treating a comma as
    the decimal separator; rows that are not numeric, or whose value is zero
    or negative, are dropped. When nothing plottable remains, or the
    conversion fails, the function falls back to ``generate_bar_vertical``
    with the original frame.

    Args:
        df: Data to plot.
        title: Chart title; when falsy a default is built from the column names.
        colors: Palette; the first ``len(rows)`` entries are passed to the pie.

    Returns:
        ``None`` when ``df`` has fewer than two columns; otherwise the result
        of ``save_plot_to_image()`` (or of the fallback chart).
    """
    if len(df.columns) < 2:
        return None

    label_col, value_col = df.columns[0], df.columns[1]

    # Work on a copy so the caller's frame is never modified
    df_plot = df.copy()
    try:
        # Convert anything that is not already numeric. Checking for the
        # 'object' dtype alone misses pandas string-extension dtypes, which
        # would skip the conversion and make the "> 0" filter below raise.
        if not pd.api.types.is_numeric_dtype(df_plot[value_col]):
            as_text = df_plot[value_col].astype(str).str.replace(',', '.', regex=False)
            df_plot[value_col] = pd.to_numeric(as_text, errors='coerce')

        # Drop rows with non-numeric, negative or zero values
        df_plot = df_plot.dropna(subset=[value_col])
        df_plot = df_plot[df_plot[value_col] > 0]

        if df_plot.empty:
            logging.error(f"[GRAPH_GENERATION] Nenhum valor numérico positivo encontrado na coluna {value_col}")
            return await generate_bar_vertical(df, title, colors)

    except Exception as e:
        # Best-effort boundary: any conversion problem degrades to a bar chart
        logging.error(f"[GRAPH_GENERATION] Erro ao converter dados para numérico: {e}")
        return await generate_bar_vertical(df, title, colors)

    plt.figure(figsize=(10, 10))

    # Slice labels carry both the absolute value and its share of the total
    total = df_plot[value_col].sum()
    labels = [f'{label} ({val:,.0f}, {val/total:.1%})' for label, val in zip(df_plot[label_col], df_plot[value_col])]

    plt.pie(df_plot[value_col], labels=labels, autopct='%1.1f%%',
            startangle=90, shadow=False, colors=colors[:len(df_plot)])

    plt.axis('equal')
    plt.title(title or f"Distribuição de {value_col} por {label_col}")
    plt.tight_layout()

    return save_plot_to_image()

async def generate_donut(df: pd.DataFrame, title: str, colors) -> Optional[Image.Image]:
    """
    Generate a donut chart (a pie with a hollow centre) from the first two
    columns of ``df``.

    The first column supplies the slice labels and the second the slice
    values. Non-numeric values are converted to numbers, treating a comma as
    the decimal separator; rows that are not numeric, or whose value is zero
    or negative, are dropped. When nothing plottable remains, or the
    conversion fails, the function falls back to ``generate_bar_vertical``
    with the original frame.

    Args:
        df: Data to plot.
        title: Chart title; when falsy a default is built from the column names.
        colors: Palette; the first ``len(rows)`` entries are passed to the pie.

    Returns:
        ``None`` when ``df`` has fewer than two columns; otherwise the result
        of ``save_plot_to_image()`` (or of the fallback chart).
    """
    if len(df.columns) < 2:
        return None

    label_col, value_col = df.columns[0], df.columns[1]

    # Work on a copy so the caller's frame is never modified
    df_plot = df.copy()
    try:
        # Convert anything that is not already numeric. Checking for the
        # 'object' dtype alone misses pandas string-extension dtypes, which
        # would skip the conversion and make the "> 0" filter below raise.
        if not pd.api.types.is_numeric_dtype(df_plot[value_col]):
            as_text = df_plot[value_col].astype(str).str.replace(',', '.', regex=False)
            df_plot[value_col] = pd.to_numeric(as_text, errors='coerce')

        # Drop rows with non-numeric, negative or zero values
        df_plot = df_plot.dropna(subset=[value_col])
        df_plot = df_plot[df_plot[value_col] > 0]

        if df_plot.empty:
            logging.error(f"[GRAPH_GENERATION] Nenhum valor numérico positivo encontrado na coluna {value_col}")
            return await generate_bar_vertical(df, title, colors)

    except Exception as e:
        # Best-effort boundary: any conversion problem degrades to a bar chart
        logging.error(f"[GRAPH_GENERATION] Erro ao converter dados para numérico: {e}")
        return await generate_bar_vertical(df, title, colors)

    plt.figure(figsize=(10, 10))

    # Slice labels carry both the absolute value and its share of the total
    total = df_plot[value_col].sum()
    labels = [f'{label} ({val:,.0f}, {val/total:.1%})' for label, val in zip(df_plot[label_col], df_plot[value_col])]

    # A donut is a pie whose wedges only span part of the radius
    plt.pie(df_plot[value_col], labels=labels, autopct='%1.1f%%',
            startangle=90, shadow=False, colors=colors[:len(df_plot)],
            wedgeprops=dict(width=0.5))  # ring width

    plt.axis('equal')
    plt.title(title or f"Distribuição de {value_col} por {label_col}")
    plt.tight_layout()

    return save_plot_to_image()

async def generate_pie_multiple(df: pd.DataFrame, title: str, colors) -> Optional[Image.Image]:
    """
    Generate a grid of pie charts, one per value of the first column.

    The first column defines the panels, the second column defines the slices
    inside each panel and the third column holds the values, which are summed
    per (panel, slice) pair. Frames with fewer than three columns are handed
    to ``generate_pie``; a non-numeric value column is handed to
    ``generate_bar_grouped``.

    Args:
        df: Data to plot.
        title: Figure title; when falsy a default is built from the column names.
        colors: Palette; each panel uses its first ``len(slices)`` entries.

    Returns:
        ``None`` when grouping yields no panels; otherwise the result of
        ``save_plot_to_image()`` (or of the delegated chart).
    """
    if len(df.columns) < 3:
        return await generate_pie(df, title, colors)

    panel_col, slice_col, value_col = df.columns[0], df.columns[1], df.columns[2]

    # Only numeric values can be aggregated into pies
    if not pd.api.types.is_numeric_dtype(df[value_col]):
        return await generate_bar_grouped(df, title, colors)

    # One row per panel, one column per slice, missing combinations as 0
    summed = df.groupby([panel_col, slice_col])[value_col].sum()
    pivot = summed.unstack().fillna(0)

    n_groups = len(pivot)
    if n_groups == 0:
        return None

    # Grid layout: at most three panels per row, rows rounded up
    n_cols = min(3, n_groups)
    n_rows = (n_groups + n_cols - 1) // n_cols

    # squeeze=False always yields a 2-D array of axes, including the 1x1 case
    fig, grid = plt.subplots(n_rows, n_cols, figsize=(15, 5 * n_rows), squeeze=False)
    panels = grid.flatten()

    for panel, (group_name, row) in zip(panels, pivot.iterrows()):
        # Zero-valued slices are left out of the pie
        positive = row[row > 0]
        if positive.empty:
            continue

        total = positive.sum()

        # Labels show the absolute value and its share within the panel
        labels = [f'{idx} ({val:.2f}, {val/total:.1%})' for idx, val in positive.items()]

        panel.pie(positive, labels=labels, autopct='%1.1f%%',
                  startangle=90, colors=colors[:len(positive)])
        panel.set_title(f"{group_name}")
        panel.axis('equal')

    # Hide the grid cells that have no group assigned
    for spare in panels[n_groups:]:
        spare.axis('off')

    plt.suptitle(title or f"Distribuição de {value_col} por {slice_col} para cada {panel_col}", fontsize=16)
    plt.tight_layout()
    plt.subplots_adjust(top=0.9)

    return save_plot_to_image()