#!/usr/bin/env python3 """ Aplicação Gradio para Análise Geoespacial - VERSÃO MELHORADA (UI + ZIP) Melhorias solicitadas: - Legendas nos gráficos (Matplotlib) e mapas (Folium) - Mapas interativos e mapas com grid passam a ser exibidos corretamente na interface (via iframe com srcdoc) - Todo output gerado é salvo e pode ser baixado em um único ZIP EXECUTAR: python3.11 app_melhorado_v3.py (ou python app_melhorado_v3.py) ACESSAR: http://localhost:7860 """ import gradio as gr import geopandas as gpd import pandas as pd import numpy as np import matplotlib.pyplot as plt import seaborn as sns import folium from folium import plugins import matplotlib.colors as mcolors from sklearn.cluster import KMeans, DBSCAN from sklearn.preprocessing import StandardScaler import warnings from datetime import datetime import tempfile import os from pathlib import Path import zipfile import html as _html warnings.filterwarnings('ignore') # Configurar estilo (mantido) sns.set_style("whitegrid") plt.rcParams['figure.figsize'] = (12, 8) plt.rcParams['font.size'] = 10 # ============================================================================ # VARIÁVEIS GLOBAIS # ============================================================================ buildings_gdf = None highways_gdf = None grid_gdf = None # Sessão atual de outputs (para ZIP) CURRENT_SESSION_DIR = None # Pasta de outputs (DEVE ficar dentro do diretório de trabalho para o Gradio aceitar downloads) # Pasta de outputs # - Em Hugging Face Spaces, é seguro escrever em /tmp (recomendado) e também no diretório do app. # - Para evitar erros de permissões/paths, usamos /tmp por padrão quando disponível. OUTPUT_ROOT = Path(os.environ.get('GEO_OUTPUT_ROOT', Path(tempfile.gettempdir()) / 'geospatial_downloads')) OUTPUT_ROOT.mkdir(parents=True, exist_ok=True) # ============================================================================ # HELPERS (ZIP + EMBED) # ============================================================================ def _ensure_session_dir(): """Cria (uma vez) a pasta de outputs da sessão atual.""" global CURRENT_SESSION_DIR if CURRENT_SESSION_DIR is None: ts = datetime.now().strftime("%Y%m%d_%H%M%S") CURRENT_SESSION_DIR = OUTPUT_ROOT / f"session_{ts}" CURRENT_SESSION_DIR.mkdir(parents=True, exist_ok=True) return CURRENT_SESSION_DIR def _save_text(name: str, content: str) -> str: """Salva texto na sessão e devolve o caminho.""" session_dir = _ensure_session_dir() fp = session_dir / name fp.write_text(content, encoding="utf-8") return str(fp) def _save_gpkg(name: str, gdf: gpd.GeoDataFrame, layer: str = "data") -> str: """Salva um GeoDataFrame em GPKG na sessão e devolve o caminho.""" session_dir = _ensure_session_dir() fp = session_dir / name # garante extensão .gpkg if fp.suffix.lower() != ".gpkg": fp = fp.with_suffix(".gpkg") # escreve (sempre sobrescreve) gdf.to_file(fp, layer=layer, driver="GPKG") return str(fp) def _copy_into_session(src_path: str, name: str | None = None) -> str: """Copia um arquivo gerado (tmp) para a pasta da sessão e devolve o novo caminho.""" session_dir = _ensure_session_dir() src = Path(src_path) dst = session_dir / (name or src.name) # leitura/escrita binária para evitar problemas cross-platform dst.write_bytes(src.read_bytes()) return str(dst) def _make_zip() -> str | None: """Empacota TODO o conteúdo da sessão em um ZIP e devolve o caminho.""" session_dir = _ensure_session_dir() # se ainda não há nada, retorna None if not any(session_dir.iterdir()): return None zip_path = session_dir.with_suffix(".zip") with zipfile.ZipFile(zip_path, "w", compression=zipfile.ZIP_DEFLATED) as z: for p in session_dir.rglob("*"): if p.is_file(): z.write(p, arcname=str(p.relative_to(session_dir))) return str(zip_path) def _iframe_srcdoc(html_content: str, height: int = 650) -> str: """ Garante exibição consistente de mapas Folium no Gradio. Usa iframe com srcdoc e HTML escapado. """ escaped = _html.escape(html_content, quote=True) return f"""
""" def _add_folium_legend(m: folium.Map, title: str, items: list[tuple[str, str]]): """ Adiciona legenda simples no canto do mapa (HTML overlay). items: [(label, color), ...] """ rows = "\n".join( [f"
" f"" f"{_html.escape(str(l))}" f"
" for l, c in items] ) legend_html = f"""
{_html.escape(title)}
{rows}
""" m.get_root().html.add_child(folium.Element(legend_html)) def create_zip_for_download(): """Gera/atualiza o ZIP com TODOS os outputs da sessão e devolve o caminho.""" try: zp = _make_zip() if zp is None: return '⚠️ Ainda não há outputs nesta sessão para empacotar.', None from pathlib import Path as _P return f'📦 ZIP gerado: {_P(zp).name}', zp except Exception as e: return f'❌ Erro ao gerar ZIP: {e}', None # ============================================================================ # FUNÇÕES DE PROCESSAMENTO # ============================================================================ def load_data(buildings_file, highways_file): """Carrega os arquivos GPKG""" global buildings_gdf, highways_gdf, grid_gdf, CURRENT_SESSION_DIR try: if buildings_file is None or highways_file is None: return "❌ Por favor, carregue ambos os arquivos (edifícios e ruas)", None # reset de sessão a cada novo carregamento (para zip limpo) CURRENT_SESSION_DIR = None grid_gdf = None buildings_gdf = gpd.read_file(buildings_file) highways_gdf = gpd.read_file(highways_file) # Reprojetar para UTM (mantido) buildings_gdf = buildings_gdf.to_crs(epsg=32632) highways_gdf = highways_gdf.to_crs(epsg=32632) # Calcular métricas básicas (mantido) buildings_gdf['area_m2'] = buildings_gdf.geometry.area buildings_gdf['perimeter_m'] = buildings_gdf.geometry.length highways_gdf['length_m'] = highways_gdf.geometry.length msg = f"""✓ Dados carregados com sucesso! 📊 EDIFÍCIOS: {len(buildings_gdf):,} registros • Área total: {buildings_gdf['area_m2'].sum():,.0f} m² • Área média: {buildings_gdf['area_m2'].mean():.0f} m² 📊 RUAS: {len(highways_gdf):,} registros • Comprimento total: {highways_gdf['length_m'].sum():,.0f} m ({highways_gdf['length_m'].sum()/1000:,.1f} km) • Comprimento médio: {highways_gdf['length_m'].mean():.0f} m 📍 Sistema de Coordenadas: {buildings_gdf.crs} ⏰ Data de Carregamento: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')} """ # salvar outputs base _save_text("status_carregamento.txt", msg) return msg except Exception as e: return f"❌ Erro ao carregar dados: {str(e)}" def exploratory_analysis(): """Análise exploratória básica""" global buildings_gdf, highways_gdf if buildings_gdf is None or highways_gdf is None: return "❌ Carregue os dados primeiro" try: report = f""" ╔════════════════════════════════════════════════════════════════╗ ║ ANÁLISE EXPLORATÓRIA - EDIFÍCIOS ║ ╚════════════════════════════════════════════════════════════════╝ 📐 ÁREA DOS EDIFÍCIOS (m²): Total: {buildings_gdf['area_m2'].sum():,.0f} m² Média: {buildings_gdf['area_m2'].mean():,.0f} m² Mediana: {buildings_gdf['area_m2'].median():,.0f} m² Mínima: {buildings_gdf['area_m2'].min():,.0f} m² Máxima: {buildings_gdf['area_m2'].max():,.0f} m² Desvio Padrão: {buildings_gdf['area_m2'].std():,.0f} m² Q1 (25%): {buildings_gdf['area_m2'].quantile(0.25):,.0f} m² Q3 (75%): {buildings_gdf['area_m2'].quantile(0.75):,.0f} m² 📏 PERÍMETRO DOS EDIFÍCIOS (m): Média: {buildings_gdf['perimeter_m'].mean():,.0f} m Mediana: {buildings_gdf['perimeter_m'].median():,.0f} m Máxima: {buildings_gdf['perimeter_m'].max():,.0f} m ╔════════════════════════════════════════════════════════════════╗ ║ ANÁLISE EXPLORATÓRIA - RUAS ║ ╚════════════════════════════════════════════════════════════════╝ 🛣️ COMPRIMENTO DAS RUAS (m): Total: {highways_gdf['length_m'].sum():,.0f} m ({highways_gdf['length_m'].sum()/1000:,.1f} km) Média: {highways_gdf['length_m'].mean():,.0f} m Mediana: {highways_gdf['length_m'].median():,.0f} m Mínima: {highways_gdf['length_m'].min():,.0f} m Máxima: {highways_gdf['length_m'].max():,.0f} m Desvio Padrão: {highways_gdf['length_m'].std():,.0f} m Q1 (25%): {highways_gdf['length_m'].quantile(0.25):,.0f} m Q3 (75%): {highways_gdf['length_m'].quantile(0.75):,.0f} m ╔════════════════════════════════════════════════════════════════╗ ║ TIPOS DE EDIFÍCIOS (TOP 15) ║ ╚════════════════════════════════════════════════════════════════╝ """ if 'building' in buildings_gdf.columns: building_types = buildings_gdf['building'].value_counts().head(15) for i, (btype, count) in enumerate(building_types.items(), 1): pct = (count / len(buildings_gdf)) * 100 bar = "█" * int(pct / 2) report += f"\n{i:2d}. {str(btype):20s}: {count:6d} ({pct:5.1f}%) {bar}" report += f""" ╔════════════════════════════════════════════════════════════════╗ ║ TIPOS DE RUAS (TOP 15) ║ ╚════════════════════════════════════════════════════════════════╝ """ if 'highway' in highways_gdf.columns: highway_types = highways_gdf['highway'].value_counts().head(15) for i, (htype, count) in enumerate(highway_types.items(), 1): pct = (count / len(highways_gdf)) * 100 bar = "█" * int(pct / 2) report += f"\n{i:2d}. {str(htype):30s}: {count:6d} ({pct:5.1f}%) {bar}" # salvar relatório _save_text("relatorio_eda.txt", report) return report except Exception as e: return f"❌ Erro na análise: {str(e)}" def create_distributions(): """Cria gráficos de distribuição (com legendas)""" global buildings_gdf, highways_gdf if buildings_gdf is None or highways_gdf is None: return None try: fig, axes = plt.subplots(2, 2, figsize=(14, 10)) fig.suptitle('Distribuições - Edifícios e Ruas', fontsize=16, fontweight='bold') # Histograma área axes[0, 0].hist(buildings_gdf['area_m2'], bins=50, edgecolor='black', alpha=0.7, color='steelblue', label='Edifícios (área)') axes[0, 0].set_xlabel('Área (m²)') axes[0, 0].set_ylabel('Frequência') axes[0, 0].set_title('Distribuição de Áreas de Edifícios') axes[0, 0].set_yscale('log') axes[0, 0].grid(True, alpha=0.3) axes[0, 0].legend(loc='upper right') # Boxplot área buildings_gdf.boxplot(column='area_m2', ax=axes[0, 1]) axes[0, 1].set_ylabel('Área (m²)') axes[0, 1].set_title('Box Plot - Áreas de Edifícios') axes[0, 1].set_yscale('log') axes[0, 1].grid(True, alpha=0.3) # legenda simples axes[0, 1].plot([], [], label='Edifícios (área)', color='black') axes[0, 1].legend(loc='upper right') # Histograma ruas axes[1, 0].hist(highways_gdf['length_m'], bins=50, edgecolor='black', alpha=0.7, color='coral', label='Ruas (comprimento)') axes[1, 0].set_xlabel('Comprimento (m)') axes[1, 0].set_ylabel('Frequência') axes[1, 0].set_title('Distribuição de Comprimentos de Ruas') axes[1, 0].set_yscale('log') axes[1, 0].grid(True, alpha=0.3) axes[1, 0].legend(loc='upper right') # Boxplot ruas highways_gdf.boxplot(column='length_m', ax=axes[1, 1]) axes[1, 1].set_ylabel('Comprimento (m)') axes[1, 1].set_title('Box Plot - Comprimentos de Ruas') axes[1, 1].set_yscale('log') axes[1, 1].grid(True, alpha=0.3) axes[1, 1].plot([], [], label='Ruas (comprimento)', color='black') axes[1, 1].legend(loc='upper right') plt.tight_layout() # Salvar em arquivo temporário e copiar para sessão with tempfile.NamedTemporaryFile(suffix='.png', delete=False) as tmp: plt.savefig(tmp.name, format='png', dpi=120, bbox_inches='tight') plt.close() out_path = _copy_into_session(tmp.name, "graficos_distribuicoes.png") return out_path except Exception as e: print(f"Erro: {e}") return None def create_types_charts(): """Cria gráficos de tipos (com legendas)""" global buildings_gdf, highways_gdf if buildings_gdf is None or highways_gdf is None: return None try: fig, axes = plt.subplots(1, 2, figsize=(16, 6)) fig.suptitle('Tipos de Edifícios e Ruas', fontsize=16, fontweight='bold') if 'building' in buildings_gdf.columns: building_types = buildings_gdf['building'].value_counts().head(15) building_types.plot(kind='barh', ax=axes[0], color='steelblue', label='Quantidade') axes[0].set_xlabel('Quantidade') axes[0].set_title('Top 15 Tipos de Edifícios') axes[0].grid(True, alpha=0.3, axis='x') axes[0].legend(loc='lower right') if 'highway' in highways_gdf.columns: highway_types = highways_gdf['highway'].value_counts().head(15) highway_types.plot(kind='barh', ax=axes[1], color='coral', label='Quantidade') axes[1].set_xlabel('Quantidade') axes[1].set_title('Top 15 Tipos de Ruas') axes[1].grid(True, alpha=0.3, axis='x') axes[1].legend(loc='lower right') plt.tight_layout() with tempfile.NamedTemporaryFile(suffix='.png', delete=False) as tmp: plt.savefig(tmp.name, format='png', dpi=120, bbox_inches='tight') plt.close() out_path = _copy_into_session(tmp.name, "graficos_tipos.png") return out_path except Exception as e: print(f"Erro: {e}") return None def spatial_analysis(): """Análise espacial com clustering + gráficos explicativos""" global buildings_gdf, highways_gdf, grid_gdf if buildings_gdf is None or highways_gdf is None: return "❌ Carregue os dados primeiro" try: # Grid grid_size = 500 minx, miny, maxx, maxy = buildings_gdf.total_bounds cols = np.arange(minx, maxx + grid_size, grid_size) rows = np.arange(miny, maxy + grid_size, grid_size) cells = [] cell_ids = [] cell_id = 0 from shapely.geometry import box for i in range(len(cols) - 1): for j in range(len(rows) - 1): cells.append(box(cols[i], rows[j], cols[i + 1], rows[j + 1])) cell_ids.append(cell_id) cell_id += 1 grid_gdf = gpd.GeoDataFrame({"cell_id": cell_ids, "geometry": cells}, crs=buildings_gdf.crs) buildings_in_grid = gpd.sjoin(buildings_gdf, grid_gdf, how="left", predicate="intersects") building_counts = buildings_in_grid.groupby("cell_id").size() grid_gdf["building_count"] = grid_gdf["cell_id"].map(building_counts).fillna(0).astype(int) cell_area_ha = (grid_size * grid_size) / 10000.0 # hectares grid_gdf["building_density"] = grid_gdf["building_count"] / cell_area_ha grid_gdf_active = grid_gdf[grid_gdf["building_count"] > 0].copy() # Clustering (usa centroides em WGS84 para estabilidade visual) b_wgs = buildings_gdf.to_crs(epsg=4326).copy() coords = np.column_stack([b_wgs.geometry.centroid.y.values, b_wgs.geometry.centroid.x.values]) scaler = StandardScaler() coords_scaled = scaler.fit_transform(coords) kmeans = KMeans(n_clusters=5, random_state=42, n_init=10) buildings_gdf["cluster_kmeans"] = kmeans.fit_predict(coords_scaled) dbscan = DBSCAN(eps=0.05, min_samples=10) buildings_gdf["cluster_dbscan"] = dbscan.fit_predict(coords_scaled) n_clusters_dbscan = len(set(buildings_gdf["cluster_dbscan"])) - (1 if -1 in buildings_gdf["cluster_dbscan"] else 0) n_noise = int((buildings_gdf["cluster_dbscan"] == -1).sum()) report = f""" ╔════════════════════════════════════════════════════════════════╗ ║ ANÁLISE ESPACIAL - GRID DE DENSIDADE ║ ╚════════════════════════════════════════════════════════════════╝ 📊 GRID (500m x 500m): Total de células: {len(grid_gdf)} Células com edifícios: {len(grid_gdf_active)} Cobertura: {(len(grid_gdf_active)/len(grid_gdf)*100):.1f}% 📈 DENSIDADE DE EDIFÍCIOS (edifícios/hectare): Média: {grid_gdf_active['building_density'].mean():.2f} Mediana: {grid_gdf_active['building_density'].median():.2f} Máxima: {grid_gdf_active['building_density'].max():.2f} Mínima: {grid_gdf_active['building_density'].min():.2f} ╔════════════════════════════════════════════════════════════════╗ ║ ANÁLISE ESPACIAL - CLUSTERING K-MEANS ║ ╚════════════════════════════════════════════════════════════════╝ 🎯 CLUSTERING K-MEANS (k=5): Total de edifícios: {len(buildings_gdf)} Clusters: {buildings_gdf['cluster_kmeans'].nunique()} Distribuição por cluster (K-Means): """ cluster_counts = buildings_gdf["cluster_kmeans"].value_counts().sort_index() total_buildings = len(buildings_gdf) for cluster, count in cluster_counts.items(): pct = (count / total_buildings) * 100 bar = "█" * int(pct / 2) # tenta usar área se existir area = 0.0 try: area = float(buildings_gdf.loc[buildings_gdf["cluster_kmeans"] == cluster, "area_m2"].sum()) except Exception: area = 0.0 report += f"\n Cluster {cluster}: {count:6d} edifícios ({pct:5.1f}%) {bar}" if area > 0: report += f" - {area:,.0f} m² de área" report += f""" ╔════════════════════════════════════════════════════════════════╗ ║ ANÁLISE ESPACIAL - CLUSTERING DBSCAN ║ ╚════════════════════════════════════════════════════════════════╝ 🎯 CLUSTERING DBSCAN: Clusters encontrados: {n_clusters_dbscan} Pontos de ruído: {n_noise} ({(n_noise/len(buildings_gdf))*100:.1f}%) """ # === Gráficos (para explicar os dados) === fig = plt.figure(figsize=(12, 8)) ax1 = fig.add_subplot(2, 2, 1) ax2 = fig.add_subplot(2, 2, 2) ax3 = fig.add_subplot(2, 2, 3) ax4 = fig.add_subplot(2, 2, 4) dens = grid_gdf_active["building_density"].replace([np.inf, -np.inf], np.nan).dropna() ax1.hist(dens, bins=30) ax1.set_title("Distribuição da densidade (edifícios/ha)") ax1.set_xlabel("edifícios/ha") ax1.set_ylabel("freq.") ax1.grid(True, alpha=0.3) top = grid_gdf_active.sort_values("building_density", ascending=False).head(10) ax2.bar(top["cell_id"].astype(str), top["building_density"]) ax2.set_title("Top 10 células por densidade") ax2.set_xlabel("cell_id") ax2.set_ylabel("edifícios/ha") ax2.tick_params(axis="x", rotation=45) ax2.grid(True, alpha=0.3) km_counts = buildings_gdf["cluster_kmeans"].value_counts().sort_index() ax3.bar(km_counts.index.astype(str), km_counts.values) ax3.set_title("K-Means: contagem por cluster") ax3.set_xlabel("cluster") ax3.set_ylabel("n edifícios") ax3.grid(True, alpha=0.3) db_counts = buildings_gdf["cluster_dbscan"].value_counts().sort_index() ax4.bar(db_counts.index.astype(str), db_counts.values) ax4.set_title("DBSCAN: contagem por rótulo (-1 = ruído)") ax4.set_xlabel("rótulo") ax4.set_ylabel("n edifícios") ax4.grid(True, alpha=0.3) fig.tight_layout() # Salva outputs adicionais _save_text("relatorio_espacial.txt", report) try: session_dir = _ensure_session_dir() fig_path = session_dir / "graficos_analise_espacial.png" fig.savefig(fig_path, dpi=160, bbox_inches="tight") except Exception: pass # Salva GPKG correspondentes (objetos que originam mapas) try: _save_gpkg("grid_500m.gpkg", grid_gdf, layer="grid") except Exception: pass try: _save_gpkg("edificios_com_clusters.gpkg", buildings_gdf, layer="buildings") except Exception: pass return report, fig except Exception as e: return f"❌ Erro na análise espacial: {str(e)}", None def create_heatmap(): """Cria mapa de calor (exibido via iframe + salvo)""" global buildings_gdf if buildings_gdf is None: return None, None, None try: buildings_wgs84 = buildings_gdf.to_crs(epsg=4326) center_lat = buildings_wgs84.geometry.centroid.y.mean() center_lon = buildings_wgs84.geometry.centroid.x.mean() # GPKG base: pontos (WGS84) + colunas de cluster (se existirem) kmeans_gdf = buildings_wgs84.copy() dbscan_gdf = buildings_wgs84.copy() if 'cluster_kmeans' in buildings_gdf.columns and 'cluster_kmeans' not in kmeans_gdf.columns: kmeans_gdf['cluster_kmeans'] = buildings_gdf['cluster_kmeans'].values if 'cluster_dbscan' in buildings_gdf.columns and 'cluster_dbscan' not in dbscan_gdf.columns: dbscan_gdf['cluster_dbscan'] = buildings_gdf['cluster_dbscan'].values m = folium.Map(location=[center_lat, center_lon], zoom_start=12, tiles='OpenStreetMap') heat_data = [] for _, row in buildings_wgs84.iterrows(): centroid = row.geometry.centroid heat_data.append([centroid.y, centroid.x]) plugins.HeatMap(heat_data, radius=15, blur=25, max_zoom=13).add_to(m) # legenda _add_folium_legend( m, "Mapa de Calor (Edifícios)", [("Intensidade = concentração de pontos", "#ef4444")] ) # salvar html with tempfile.NamedTemporaryFile(suffix='.html', delete=False, mode='w', encoding='utf-8') as tmp: m.save(tmp.name) html_content = Path(tmp.name).read_text(encoding="utf-8") out_path = _copy_into_session(tmp.name, "mapa_heatmap.html") # Salva GPKG correspondente (pontos usados no heatmap) gpkg_path = None try: gpkg_path = _save_gpkg("heatmap_pontos.gpkg", buildings_wgs84, layer="heatmap_points") except Exception: gpkg_path = None return _iframe_srcdoc(html_content, height=650), out_path, gpkg_path except Exception as e: print(f"Erro: {e}") return None, None, None def create_clustering_maps(): """Cria mapas de clustering (K-Means e DBSCAN) com legenda. Observação: para performance, o mapa pode usar amostragem visual quando há muitos pontos. Os GPKGs salvos contêm TODOS os pontos (sem amostragem). """ global buildings_gdf if buildings_gdf is None or len(buildings_gdf) == 0: return None, None, None, None, None, None try: # Trabalha em WGS84 para mapas buildings_wgs84 = buildings_gdf.to_crs(epsg=4326).copy() # Centróides (uma vez) centroids = buildings_wgs84.geometry.centroid buildings_wgs84["_lat"] = centroids.y.values buildings_wgs84["_lon"] = centroids.x.values center_lat = float(buildings_wgs84["_lat"].mean()) center_lon = float(buildings_wgs84["_lon"].mean()) # Garante colunas de cluster (para o GPKG e para o mapa) coords = np.column_stack([buildings_wgs84["_lat"].values, buildings_wgs84["_lon"].values]) coords_scaled = StandardScaler().fit_transform(coords) if "cluster_kmeans" not in buildings_gdf.columns: kmeans = KMeans(n_clusters=5, random_state=42, n_init=10) buildings_gdf["cluster_kmeans"] = kmeans.fit_predict(coords_scaled) if "cluster_dbscan" not in buildings_gdf.columns: dbscan = DBSCAN(eps=0.05, min_samples=10) buildings_gdf["cluster_dbscan"] = dbscan.fit_predict(coords_scaled) # Copias em WGS84 (para salvar e para mapear) kmeans_gdf = buildings_wgs84.copy() dbscan_gdf = buildings_wgs84.copy() kmeans_gdf["cluster_kmeans"] = buildings_gdf["cluster_kmeans"].values dbscan_gdf["cluster_dbscan"] = buildings_gdf["cluster_dbscan"].values # --------- AMOSTRAGEM VISUAL (para o HTML não travar) ---------- MAX_POINTS_MAP = 15000 def _sample_for_map(gdf, label_col=None): if len(gdf) <= MAX_POINTS_MAP: return gdf if label_col and label_col in gdf.columns: # amostragem estratificada por rótulo parts = [] groups = gdf.groupby(label_col, dropna=False) # distribui a cota proporcionalmente for _, grp in groups: n = max(1, int(len(grp) / len(gdf) * MAX_POINTS_MAP)) parts.append(grp.sample(n=min(n, len(grp)), random_state=42)) out = pd.concat(parts, ignore_index=True) # se ainda excedeu, corta if len(out) > MAX_POINTS_MAP: out = out.sample(n=MAX_POINTS_MAP, random_state=42) return out # fallback: amostra simples return gdf.sample(n=MAX_POINTS_MAP, random_state=42) kmeans_map_gdf = _sample_for_map(kmeans_gdf, "cluster_kmeans") dbscan_map_gdf = _sample_for_map(dbscan_gdf, "cluster_dbscan") # ----------------- KMEANS MAP ----------------- m1 = folium.Map(location=[center_lat, center_lon], zoom_start=12, tiles="OpenStreetMap") colors = ["red", "blue", "green", "purple", "orange"] # usa loop apenas na amostra (mais leve) for _, row in kmeans_map_gdf.iterrows(): cluster = int(row.get("cluster_kmeans", 0)) color = colors[cluster % len(colors)] folium.CircleMarker( location=[float(row["_lat"]), float(row["_lon"])], radius=3, color=color, fill=True, fillColor=color, fillOpacity=0.6, weight=1, ).add_to(m1) _add_folium_legend( m1, "K-Means (clusters)", [(f"Cluster {i}", colors[i % len(colors)]) for i in range(5)], ) # ----------------- DBSCAN MAP ----------------- m2 = folium.Map(location=[center_lat, center_lon], zoom_start=12, tiles="OpenStreetMap") # nº clusters (ignorando ruído -1) labels = dbscan_gdf["cluster_dbscan"].values n_clusters_dbscan = len(set(labels)) - (1 if -1 in labels else 0) cmap = plt.cm.tab20(np.linspace(0, 1, max(n_clusters_dbscan, 1))) for _, row in dbscan_map_gdf.iterrows(): cluster = int(row.get("cluster_dbscan", -1)) if cluster == -1: color = "gray" opacity = 0.3 else: color = mcolors.rgb2hex(cmap[cluster % max(n_clusters_dbscan, 1)]) opacity = 0.7 folium.CircleMarker( location=[float(row["_lat"]), float(row["_lon"])], radius=3, color=color, fill=True, fillColor=color, fillOpacity=opacity, weight=1, ).add_to(m2) legend_items = [("Ruído (-1)", "gray")] # amostra (até 8 itens) para não explodir a legenda for i in range(min(n_clusters_dbscan, 8)): legend_items.append((f"Cluster {i}", mcolors.rgb2hex(cmap[i % max(n_clusters_dbscan, 1)]))) _add_folium_legend(m2, "DBSCAN (clusters)", legend_items) # salvar htmls (sempre copiando para a pasta da sessão) with tempfile.NamedTemporaryFile(suffix=".html", delete=False, mode="w", encoding="utf-8") as tmp1: m1.save(tmp1.name) kmeans_html = Path(tmp1.name).read_text(encoding="utf-8") kmeans_file = _copy_into_session(tmp1.name, "mapa_kmeans.html") with tempfile.NamedTemporaryFile(suffix=".html", delete=False, mode="w", encoding="utf-8") as tmp2: m2.save(tmp2.name) dbscan_html = Path(tmp2.name).read_text(encoding="utf-8") dbscan_file = _copy_into_session(tmp2.name, "mapa_dbscan.html") # Salva GPKG correspondentes (TODOS os pontos + rótulos) kmeans_gpkg = None dbscan_gpkg = None try: kmeans_gpkg = _save_gpkg("kmeans_pontos_clusters.gpkg", kmeans_gdf.drop(columns=["_lat","_lon"], errors="ignore"), layer="kmeans") except Exception: kmeans_gpkg = None try: dbscan_gpkg = _save_gpkg("dbscan_pontos_clusters.gpkg", dbscan_gdf.drop(columns=["_lat","_lon"], errors="ignore"), layer="dbscan") except Exception: dbscan_gpkg = None return kmeans_html, kmeans_file, dbscan_html, dbscan_file, kmeans_gpkg, dbscan_gpkg except Exception as e: print(f"Erro em create_clustering_maps: {e}") return None, None, None, None, None, None def create_grid_maps(): """Cria mapas com grid (exibidos via iframe + salvos)""" global buildings_gdf, highways_gdf, grid_gdf if buildings_gdf is None or grid_gdf is None or highways_gdf is None: return None, None, None, None, None, None try: grid_wgs84 = grid_gdf.to_crs(epsg=4326) buildings_wgs84 = buildings_gdf.to_crs(epsg=4326) highways_wgs84 = highways_gdf.to_crs(epsg=4326) center_lat = buildings_wgs84.geometry.centroid.y.mean() center_lon = buildings_wgs84.geometry.centroid.x.mean() # Mapa 1: Densidade de edifícios m1 = folium.Map(location=[center_lat, center_lon], zoom_start=12, tiles='OpenStreetMap') # bins e legenda (mantém suas cores, só adiciona legenda) legend_buildings = [ ("0", "white"), ("< 2", "#ffffcc"), ("2–4", "#ffeda0"), ("4–6", "#fed976"), ("6–8", "#feb24c"), ("8–10", "#fd8d3c"), (">= 10", "#e31a1c"), ] for idx, row in grid_wgs84.iterrows(): density = float(grid_gdf.loc[idx, 'building_density']) if density == 0: color = 'white' opacity = 0 elif density < 2: color = '#ffffcc' opacity = 0.3 elif density < 4: color = '#ffeda0' opacity = 0.4 elif density < 6: color = '#fed976' opacity = 0.5 elif density < 8: color = '#feb24c' opacity = 0.6 elif density < 10: color = '#fd8d3c' opacity = 0.7 else: color = '#e31a1c' opacity = 0.8 folium.GeoJson( data=row.geometry.__geo_interface__, style_function=lambda _, color=color, opacity=opacity: { 'fillColor': color, 'color': 'black', 'weight': 0.5, 'fillOpacity': opacity } ).add_to(m1) _add_folium_legend(m1, "Densidade de edifícios (por ha)", legend_buildings) # Mapa 2: Densidade de ruas m2 = folium.Map(location=[center_lat, center_lon], zoom_start=12, tiles='OpenStreetMap') roads_per_cell = [] for cell in grid_gdf.geometry: roads_in_cell = highways_gdf[highways_gdf.geometry.intersects(cell)] roads_per_cell.append(float(roads_in_cell['length_m'].sum()) if len(roads_in_cell) > 0 else 0.0) grid_gdf['road_density'] = np.array(roads_per_cell) / (500 ** 2) * 10000 max_road_density = float(grid_gdf['road_density'].max()) if float(grid_gdf['road_density'].max()) > 0 else 1.0 legend_roads = [ ("0", "white"), ("Baixa", "#f7fbff"), ("Média-baixa", "#deebf7"), ("Média", "#9ecae1"), ("Média-alta", "#3182bd"), ("Alta", "#08519c"), ] for idx, row in grid_wgs84.iterrows(): road_density = float(grid_gdf.loc[idx, 'road_density']) if road_density == 0: color = 'white' opacity = 0 else: intensity = road_density / max_road_density if intensity < 0.2: color = '#f7fbff' elif intensity < 0.4: color = '#deebf7' elif intensity < 0.6: color = '#9ecae1' elif intensity < 0.8: color = '#3182bd' else: color = '#08519c' opacity = 0.7 folium.GeoJson( data=row.geometry.__geo_interface__, style_function=lambda _, color=color, opacity=opacity: { 'fillColor': color, 'color': 'black', 'weight': 0.5, 'fillOpacity': opacity } ).add_to(m2) _add_folium_legend(m2, "Densidade de ruas (m/ha)", legend_roads) # salvar htmls + copiar p/ sessão with tempfile.NamedTemporaryFile(suffix='.html', delete=False, mode='w', encoding='utf-8') as tmp1: m1.save(tmp1.name) grid_html = Path(tmp1.name).read_text(encoding="utf-8") grid_file = _copy_into_session(tmp1.name, "grid_densidade_edificios.html") with tempfile.NamedTemporaryFile(suffix='.html', delete=False, mode='w', encoding='utf-8') as tmp2: m2.save(tmp2.name) roads_html = Path(tmp2.name).read_text(encoding="utf-8") roads_file = _copy_into_session(tmp2.name, "grid_densidade_ruas.html") # Salva GPKG correspondentes (grid + métricas) # NOTE: o usuário quer sempre o GPKG correspondente a cada mapa. # Aqui salvamos o grid com as métricas calculadas. grid_gpkg = None roads_gpkg = None try: grid_buildings = grid_gdf[["building_density", "geometry"]].copy() grid_gpkg = _save_gpkg("grid_densidade_edificios.gpkg", grid_buildings, layer="grid_buildings") except Exception: grid_gpkg = None try: grid_roads = grid_gdf[["road_density", "geometry"]].copy() roads_gpkg = _save_gpkg("grid_densidade_ruas.gpkg", grid_roads, layer="grid_roads") except Exception: roads_gpkg = None return grid_html, grid_file, roads_html, roads_file, grid_gpkg, roads_gpkg except Exception as e: print(f"Erro: {e}") return None, None, None, None, None, None def get_kmeans_data(): kmeans_html, kmeans_file, _, _, kmeans_gpkg, _ = create_clustering_maps() if kmeans_html is None: return None, None, None return _iframe_srcdoc(kmeans_html, height=650), kmeans_file, kmeans_gpkg def get_dbscan_data(): _, _, dbscan_html, dbscan_file, _, dbscan_gpkg = create_clustering_maps() if dbscan_html is None: return None, None, None return _iframe_srcdoc(dbscan_html, height=650), dbscan_file, dbscan_gpkg def get_grid_data(): grid_html, grid_file, roads_html, roads_file, grid_gpkg, roads_gpkg = create_grid_maps() if grid_html is None: return None, None, None, None, None, None return ( _iframe_srcdoc(grid_html, height=650), grid_file, grid_gpkg, _iframe_srcdoc(roads_html, height=650), roads_file, roads_gpkg ) def get_zip_download(): """Gera/atualiza o ZIP sob demanda.""" msg, zp = create_zip_for_download() return zp # ============================================================================ # INTERFACE GRADIO # ============================================================================ with gr.Blocks(title="Análise Geoespacial", theme=gr.themes.Soft()) as demo: gr.Markdown("# 🗺️ Análise Geoespacial - Edifícios e Ruas") gr.Markdown("**Aplicação para análise exploratória de dados geoespaciais**") # Download do ZIP sempre visível with gr.Row(): zip_btn = gr.Button("📦 Gerar/Atualizar ZIP (tudo)", variant="primary") zip_file = gr.File(label="⬇️ Download ZIP (tudo)") zip_btn.click(fn=get_zip_download, outputs=zip_file) with gr.Tab("📁 Upload de Dados"): gr.Markdown("## Carregue seus arquivos GPKG") with gr.Row(): buildings_file = gr.File(label="📦 Arquivo de Edifícios (GPKG)", file_types=[".gpkg"]) highways_file = gr.File(label="📦 Arquivo de Ruas (GPKG)", file_types=[".gpkg"]) load_btn = gr.Button("🔄 Carregar Dados", variant="primary", size="lg") status_output = gr.Textbox(label="Status", lines=12, interactive=False) load_btn.click( fn=load_data, inputs=[buildings_file, highways_file], outputs=status_output ) with gr.Tab("📊 Análise Exploratória"): gr.Markdown("## Estatísticas Descritivas e Visualizações") with gr.Row(): eda_btn = gr.Button("📈 Gerar Análise Exploratória", variant="primary", size="lg") eda_output = gr.Textbox(label="Relatório EDA", lines=35, interactive=False) eda_btn.click(fn=exploratory_analysis, outputs=eda_output) gr.Markdown("## Visualizações") with gr.Row(): dist_btn = gr.Button("📊 Distribuições", size="lg") types_btn = gr.Button("📊 Tipos", size="lg") with gr.Row(): dist_output = gr.Image(label="Gráficos de Distribuição") types_output = gr.Image(label="Tipos de Edifícios e Ruas") # Atualiza também o ZIP a cada geração dist_btn.click(fn=create_distributions, outputs=dist_output) types_btn.click(fn=create_types_charts, outputs=types_output) with gr.Tab("🎯 Análise Espacial"): gr.Markdown("## Clustering e Densidade") spatial_btn = gr.Button("🔍 Análise Espacial", variant="primary", size="lg") spatial_output = gr.Textbox(label="Relatório Espacial", lines=35, interactive=False) spatial_plot = gr.Plot(label="📊 Gráficos - Análise Espacial") spatial_btn.click(fn=spatial_analysis, outputs=[spatial_output, spatial_plot]) with gr.Tab("🗺️ Mapas Interativos"): gr.Markdown("## Visualizações Geoespaciais") with gr.Row(): heatmap_btn = gr.Button("🔥 Mapa de Calor", size="lg") kmeans_btn = gr.Button("🎯 K-Means", size="lg") dbscan_btn = gr.Button("🎯 DBSCAN", size="lg") heatmap_output = gr.HTML(value="

Clique no botão acima para gerar o mapa de calor

", label="Mapa de Calor") heatmap_download = gr.File(label="⬇️ Download Heatmap (HTML)") heatmap_gpkg = gr.File(label="⬇️ GPKG Heatmap (pontos)") kmeans_output = gr.HTML(value="

Clique no botão acima para gerar o mapa K-Means

", label="K-Means") kmeans_download = gr.File(label="⬇️ Download K-Means (HTML)") kmeans_gpkg = gr.File(label="⬇️ GPKG K-Means (pontos+clusters)") dbscan_output = gr.HTML(value="

Clique no botão acima para gerar o mapa DBSCAN

", label="DBSCAN") dbscan_download = gr.File(label="⬇️ Download DBSCAN (HTML)") dbscan_gpkg = gr.File(label="⬇️ GPKG DBSCAN (pontos+rótulos)") heatmap_btn.click(fn=create_heatmap, outputs=[heatmap_output, heatmap_download, heatmap_gpkg]) kmeans_btn.click(fn=get_kmeans_data, outputs=[kmeans_output, kmeans_download, kmeans_gpkg]) dbscan_btn.click(fn=get_dbscan_data, outputs=[dbscan_output, dbscan_download, dbscan_gpkg]) with gr.Tab("🔲 Mapas com Grid"): gr.Markdown("## Análise de Densidade com Grid (500m x 500m)") with gr.Row(): grid_btn = gr.Button("📊 Gerar Mapas com Grid", variant="primary", size="lg") # Grid 1: Edifícios grid_output = gr.HTML( value="

Clique no botão acima para gerar o grid de edifícios

", label="Grid de Densidade - Edifícios" ) with gr.Row(): grid_download = gr.File(label="⬇️ Download Grid Edifícios (HTML)", interactive=False) grid_gpkg = gr.File(label="⬇️ Download GPKG Grid Edifícios", interactive=False) # Grid 2: Ruas roads_output = gr.HTML( value="

Clique no botão acima para gerar o grid de ruas

", label="Grid de Densidade - Ruas" ) with gr.Row(): roads_download = gr.File(label="⬇️ Download Grid Ruas (HTML)", interactive=False) roads_gpkg = gr.File(label="⬇️ Download GPKG Grid Ruas", interactive=False) grid_btn.click( fn=get_grid_data, outputs=[grid_output, grid_download, grid_gpkg, roads_output, roads_download, roads_gpkg] ) with gr.Tab("ℹ️ Sobre"): gr.Markdown(""" ## 📖 Sobre esta Aplicação Aplicação para **análise geoespacial exploratória (EDA) completa** sobre dados de edifícios e ruas. ### ✨ Funcionalidades: - ✅ Upload de arquivos GPKG - ✅ Análise exploratória com estatísticas descritivas - ✅ Visualizações de distribuições **com legendas** - ✅ Análise espacial com clustering (K-Means e DBSCAN) - ✅ Mapas interativos **exibidos na interface** (heatmap, clustering) + legendas - ✅ Mapas com Grid de Densidade (500m x 500m) **exibidos na interface** + legendas - ✅ Download consolidado de **tudo** em um ZIP ### 🚀 Como Usar Localmente: ```bash python3.11 app_melhorado_v3.py ``` Depois acesse: http://localhost:7860 """) if __name__ == "__main__": print("=" * 80) print("🗺️ APLICAÇÃO GRADIO - ANÁLISE GEOESPACIAL (UI + ZIP)") print("=" * 80) print("\n✓ Iniciando aplicação...") print("✓ Acesse: http://localhost:7860") print("✓ Pressione CTRL+C para parar\n") # Em Hugging Face Spaces, a porta é fornecida via variável de ambiente PORT. server_port = int(os.environ.get('PORT', '7860')) demo.launch(server_name="0.0.0.0", server_port=server_port, share=False, allowed_paths=[str(OUTPUT_ROOT)])