# -*- coding: utf-8 -*- """Untitled0.ipynb Automatically generated by Colab. Original file is located at https://colab.research.google.com/drive/1lA4vvx9sbWFfjQHAmGs8ADgwhNOypfsM """ import pandas as pd import numpy as np import matplotlib.pyplot as plt import gradio as gr import io import base64 from datetime import datetime from sklearn.ensemble import RandomForestRegressor from sklearn.metrics import r2_score, mean_squared_error import tempfile print("🚀 Iniciando GeoPredict en Hugging Face...") # ============================================================================== # BLOQUE 1: ENTRENAMIENTO DEL MODELO (se ejecuta al iniciar) # ============================================================================== print("📂 Cargando y entrenando modelos...") # Cargar datos df = pd.read_excel('base_datos.xlsx') # Limpieza robusta df['N60'] = pd.to_numeric(df['N60'], errors='coerce') df['φ_grados'] = pd.to_numeric(df['φ_grados'], errors='coerce') df['Densidad_relativa'] = df['Densidad_relativa'].astype(str).str.replace(r'[-%]', '', regex=True) df['Densidad_relativa'] = pd.to_numeric(df['Densidad_relativa'], errors='coerce') df['Cu/Su (KPa)'] = pd.to_numeric(df['Cu/Su (KPa)'], errors='coerce') df = df.dropna(subset=['MATERIAL', 'N60'], how='all') # Configuración de modelos config = [ ('ARENA', 'φ_grados', 'Ángulo de fricción (φ)', 'grados'), ('GRAVA', 'φ_grados', 'Ángulo de fricción (φ)', 'grados'), ('ARCILLA', 'Cu/Su (KPa)', 'Resistencia no drenada (Cu/Su)', 'kPa'), ('ARENA', 'Densidad_relativa', 'Densidad relativa (Dr)', 'decimal'), ('GRAVA', 'Densidad_relativa', 'Densidad relativa (Dr)', 'decimal') ] modelos_rf = {} for material, col_y, nombre_prop, unidad in config: print(f"🧠 Entrenando: {material} → {nombre_prop}") df_mat = df[df['MATERIAL'] == material].copy() X = df_mat[['N60']] y = df_mat[col_y] mask = y.notnull() X, y = X[mask], y[mask] if len(X) < 5: print(f" ⚠️ Pocos datos. Saltando...") continue # Entrenar Random Forest model = RandomForestRegressor(n_estimators=100, random_state=42) model.fit(X, y) # Evaluar y_pred = model.predict(X) r2 = r2_score(y, y_pred) rmse = np.sqrt(mean_squared_error(y, y_pred)) # Guardar modelo clave = f"{material}_{col_y}" modelos_rf[clave] = { 'modelo': model, 'R2': r2, 'RMSE': rmse, 'unidad': unidad, 'propiedad': nombre_prop, 'X_train': X.values.flatten(), 'y_train': y.values.flatten() } print("✅ Modelos entrenados correctamente") # ============================================================================== # BLOQUE 2: CONFIGURACIÓN Y FUNCIONES PARA GRADIO # ============================================================================== # Configuración profesional de matplotlib plt.rcParams['font.size'] = 12 plt.rcParams['axes.grid'] = True plt.rcParams['grid.alpha'] = 0.3 # RANGOS por material RANGOS_MATERIAL = { 'ARENA': {'min': 1, 'max': 60, 'defecto': 25, 'rango_real': "1-60"}, 'GRAVA': {'min': 5, 'max': 100, 'defecto': 40, 'rango_real': "5-100"}, 'ARCILLA': {'min': 5, 'max': 30, 'defecto': 15, 'rango_real': "5-30"} } def predecir_propiedades_completo(material, n60, nombre_ing, ubicacion, proyecto): """Función completa para predicciones profesionales""" try: # Validar rango rango = RANGOS_MATERIAL[material] if n60 < rango['min'] or n60 > rango['max']: raise ValueError(f"N60 = {n60} fuera del rango válido para {material} ({rango['min']}-{rango['max']})") predicciones = {} graficas_base64 = [] detalles_modelo = [] if material in ['ARENA', 'GRAVA']: # Predicción para φ clave_phi = f"{material}_φ_grados" if clave_phi in modelos_rf: info = modelos_rf[clave_phi] phi_pred = info['modelo'].predict([[n60]])[0] predicciones['Ángulo de Fricción (φ)'] = { 'valor': f"{phi_pred:.1f}°", 'valor_num': phi_pred, 'r2': info['R2'], 'rmse': info['RMSE'] } # Gráfica para φ fig, ax = plt.subplots(figsize=(10, 6)) sample_size = min(50, len(info['X_train'])) sample_indices = np.random.choice(len(info['X_train']), size=sample_size, replace=False) X_sample = info['X_train'][sample_indices] y_sample = info['y_train'][sample_indices] ax.scatter(X_sample, y_sample, alpha=0.7, color='steelblue', s=60, label='Datos de Campo', edgecolors='white', linewidth=0.5) N60_plot = np.linspace(info['X_train'].min(), info['X_train'].max(), 100).reshape(-1, 1) y_plot = info['modelo'].predict(N60_plot) ax.plot(N60_plot, y_plot, color='purple', linewidth=3, label='Modelo Random Forest') ax.scatter([n60], [phi_pred], color='red', s=150, zorder=5, marker='*', label=f'Predicción: {phi_pred:.1f}°') ax.axvline(x=n60, color='red', linestyle='--', alpha=0.5) ax.axhline(y=phi_pred, color='red', linestyle='--', alpha=0.5) ax.set_title(f'{material}: Ángulo de Fricción (φ)\nR² = {info["R2"]:.3f} | RMSE = {info["RMSE"]:.2f}', fontsize=14, fontweight='bold') ax.set_xlabel('N60 (SPT)', fontsize=12) ax.set_ylabel('φ (grados)', fontsize=12) ax.legend() ax.grid(True, alpha=0.3) plt.tight_layout() buf = io.BytesIO() plt.savefig(buf, format='png', dpi=100, bbox_inches='tight') buf.seek(0) graficas_base64.append(base64.b64encode(buf.getvalue()).decode('utf-8')) plt.close() # Predicción para Dr clave_dr = f"{material}_Densidad_relativa" if clave_dr in modelos_rf: info = modelos_rf[clave_dr] dr_pred = info['modelo'].predict([[n60]])[0] * 100 predicciones['Densidad Relativa (Dr)'] = { 'valor': f"{dr_pred:.1f}%", 'valor_num': dr_pred, 'r2': info['R2'], 'rmse': info['RMSE'] } # Gráfica para Dr fig, ax = plt.subplots(figsize=(10, 6)) sample_size = min(50, len(info['X_train'])) sample_indices = np.random.choice(len(info['X_train']), size=sample_size, replace=False) X_sample = info['X_train'][sample_indices] y_sample = info['y_train'][sample_indices] * 100 ax.scatter(X_sample, y_sample, alpha=0.7, color='green', s=60, label='Datos de Campo', edgecolors='white', linewidth=0.5) N60_plot = np.linspace(info['X_train'].min(), info['X_train'].max(), 100).reshape(-1, 1) y_plot = info['modelo'].predict(N60_plot) * 100 ax.plot(N60_plot, y_plot, color='purple', linewidth=3, label='Modelo Random Forest') ax.scatter([n60], [dr_pred], color='red', s=150, zorder=5, marker='*', label=f'Predicción: {dr_pred:.1f}%') ax.axvline(x=n60, color='red', linestyle='--', alpha=0.5) ax.axhline(y=dr_pred, color='red', linestyle='--', alpha=0.5) ax.set_title(f'{material}: Densidad Relativa (Dr)\nR² = {info["R2"]:.3f} | RMSE = {info["RMSE"]:.3f}', fontsize=14, fontweight='bold') ax.set_xlabel('N60 (SPT)', fontsize=12) ax.set_ylabel('Dr (%)', fontsize=12) ax.legend() ax.grid(True, alpha=0.3) plt.tight_layout() buf = io.BytesIO() plt.savefig(buf, format='png', dpi=100, bbox_inches='tight') buf.seek(0) graficas_base64.append(base64.b64encode(buf.getvalue()).decode('utf-8')) plt.close() elif material == 'ARCILLA': clave_cu = "ARCILLA_Cu/Su (KPa)" if clave_cu in modelos_rf: info = modelos_rf[clave_cu] cu_pred = info['modelo'].predict([[n60]])[0] predicciones['Resistencia No Drenada (Cu)'] = { 'valor': f"{cu_pred:.1f} kPa", 'valor_num': cu_pred, 'r2': info['R2'], 'rmse': info['RMSE'] } # Gráfica para Cu fig, ax = plt.subplots(figsize=(10, 6)) sample_size = min(50, len(info['X_train'])) sample_indices = np.random.choice(len(info['X_train']), size=sample_size, replace=False) X_sample = info['X_train'][sample_indices] y_sample = info['y_train'][sample_indices] ax.scatter(X_sample, y_sample, alpha=0.7, color='coral', s=60, label='Datos de Campo', edgecolors='white', linewidth=0.5) N60_plot = np.linspace(info['X_train'].min(), info['X_train'].max(), 100).reshape(-1, 1) y_plot = info['modelo'].predict(N60_plot) ax.plot(N60_plot, y_plot, color='purple', linewidth=3, label='Modelo Random Forest') ax.scatter([n60], [cu_pred], color='red', s=150, zorder=5, marker='*', label=f'Predicción: {cu_pred:.1f} kPa') ax.axvline(x=n60, color='red', linestyle='--', alpha=0.5) ax.axhline(y=cu_pred, color='red', linestyle='--', alpha=0.5) ax.set_title(f'Arcilla: Resistencia No Drenada (Cu)\nR² = {info["R2"]:.3f} | RMSE = {info["RMSE"]:.2f}', fontsize=14, fontweight='bold') ax.set_xlabel('N60 (SPT)', fontsize=12) ax.set_ylabel('Cu (kPa)', fontsize=12) ax.legend() ax.grid(True, alpha=0.3) plt.tight_layout() buf = io.BytesIO() plt.savefig(buf, format='png', dpi=100, bbox_inches='tight') buf.seek(0) graficas_base64.append(base64.b64encode(buf.getvalue()).decode('utf-8')) plt.close() # Generar reporte HTML reporte_html = generar_reporte_completo(predicciones, graficas_base64, material, n60, nombre_ing, ubicacion, proyecto) # HTML para mostrar en la interfaz resultados_html = f"""
{material} | N60 = {n60} | {datetime.now().strftime('%d/%m/%Y %H:%M')}
{str(e)}
{material} | N60 = {n60} | {datetime.now().strftime('%d/%m/%Y %H:%M')}
Proyecto: {proyecto}
Ubicación: {ubicacion}
Ingeniero: {nombre_ing}
Material: {material}
N60 (SPT): {n60}
Fecha: {datetime.now().strftime('%d/%m/%Y %H:%M')}
GeoPredict Pro - Sistema de Predicción Geotécnica con IA
Reporte generado automáticamente el {datetime.now().strftime('%d/%m/%Y')}
📄 Ejecuta una predicción para generar el reporte