Spaces:

jcalbornoz
/

comparablesavaluos

Sleeping

App Files Files Community

jcalbornoz committed on Dec 23, 2025

Commit

001054b

verified ·

1 Parent(s): 729b57b

Update app.py

Browse files

Files changed (1) hide show

app.py +31 -65

app.py CHANGED Viewed

@@ -6,12 +6,12 @@ import sqlite3
 import os
 import numpy as np
 from datetime import datetime, timedelta
-from urllib.parse import urlparse, urlunparse
 # --- 1. CONFIGURACIÓN ---
 API_KEY = os.getenv("GOOGLE_API_KEY")
 SEARCH_ENGINE_ID = os.getenv("SEARCH_ENGINE_ID")
-DB_NAME = "data_cache_v13.db" # Nueva DB para limpiar filtros anteriores
 # --- 2. GESTIÓN DE BASE DE DATOS ---
 def iniciar_db():
@@ -51,26 +51,16 @@ def leer_cache(query):
 # --- 3. EXTRACCIÓN Y VALIDACIÓN ---
 def analizar_tipo_url(url):
-    """
-    Retorna 1 si es INMUEBLE DIRECTO, 0 si es LISTADO/BUSQUEDA.
-    """
     url = url.lower()
-    # 1. Indicadores de Inmueble Único (Fuerte)
     positivos = ['/inmueble/', '/proyecto/', '/propiedad/', 'detalle', 'p-', 'id-', 'cod-', 'mco-', 'mla-']
     if any(p in url for p in positivos): return 1
-    # 2. Indicadores de Listado (Fuerte)
     negativos = ['listado', 'resultados', 'buscar', 'search', 'ordenar', 'filtrar', 'page']
     if any(n in url for n in negativos): return 0
-    # 3. Casos neutros (Asumimos listado por precaución)
     return 0
 def limpiar_url(url):
     try:
         parsed = urlparse(url)
-        # Quitamos query params para intentar limpiar redirecciones
         clean = urlunparse((parsed.scheme, parsed.netloc, parsed.path, '', '', ''))
         return clean
     except:
@@ -98,7 +88,6 @@ def extraer_coordenadas(item):
 def parsear_texto_completo(texto):
     texto = texto.lower()
-    # Precio
     precio = 0
     match_precio = re.search(r'\$\s?([\d.,]+)', texto)
     if match_precio:
@@ -106,7 +95,6 @@ def parsear_texto_completo(texto):
         try: precio = float(s)
         except: pass
-    # Área
     area = 0
     match_area = re.search(r'(\d+[\.,]?\d*)\s?(m2|mt|mts|metro)', texto)
     if match_area:
@@ -114,21 +102,18 @@ def parsear_texto_completo(texto):
         try: area = float(s_area)
         except: pass
-    # Habitaciones
     habs = 0
     match_habs = re.search(r'(\d+)\s?(hab|alcoba|dormitorio)', texto)
     if match_habs:
         try: habs = int(match_habs.group(1))
         except: pass
-    # Baños
     banos = 0
     match_banos = re.search(r'(\d+)\s?(baño|bano)', texto)
     if match_banos:
         try: banos = int(match_banos.group(1))
         except: pass
-    # Garajes
     garajes = 0
     match_garaje = re.search(r'(\d+)\s?(parqueadero|garaje)', texto)
     if match_garaje:
@@ -137,14 +122,12 @@ def parsear_texto_completo(texto):
     elif "garaje" in texto or "parqueadero" in texto:
         garajes = 1
-    # Estrato
     estrato = 0
     match_estrato = re.search(r'estrato\s?:?\s?(\d)', texto)
     if match_estrato:
         try: estrato = int(match_estrato.group(1))
         except: pass
-    # Antigüedad
     antiguedad = -1
     if "estrenar" in texto or "nuevo" in texto or "sobre planos" in texto:
         antiguedad = 0
@@ -154,7 +137,6 @@ def parsear_texto_completo(texto):
             try: antiguedad = int(match_anos.group(1))
             except: pass
-    # Seguridad
     seguridad = 0
     if any(k in texto for k in ['conjunto', 'vigilancia', 'porteria', 'seguridad', 'club house', 'cerrado']):
         seguridad = 1
@@ -166,8 +148,6 @@ def buscar_google(query):
     if not API_KEY or not SEARCH_ENGINE_ID: return []
     url = "https://www.googleapis.com/customsearch/v1"
-    # Quitamos filtros negativos (-listado) porque estaban bloqueando todo.
-    # Usamos "detalle" como sugerencia suave.
     query_optimizada = f"{query} detalle"
     query_optimizada = query_optimizada.replace(",", " OR ")
@@ -184,11 +164,7 @@ def buscar_google(query):
         if 'items' in data:
             for item in data['items']:
                 raw_link = item.get('link', '')
-                # Clasificamos la URL (1=Directo, 0=Listado)
-                # NOTA: Ya no filtramos (continue), aceptamos ambos.
                 es_directo = analizar_tipo_url(raw_link)
                 final_link = limpiar_url(raw_link)
                 texto = f"{item.get('title')} {item.get('snippet')}"
@@ -200,7 +176,6 @@ def buscar_google(query):
                 elif "metrocuadrado" in raw_link: fuente = "Metrocuadrado"
                 elif "wasi" in raw_link: fuente = "Wasi"
-                # Guardamos si encontramos datos válidos, aunque el link sea un listado
                 if precio > 0 or area > 0:
                     resultados.append({
                         'titulo': item.get('title'),
@@ -219,34 +194,28 @@ def calcular_scores(df, p_ref, a_ref, h_ref, b_ref, g_ref, e_ref, antiguedad_ref
     if df.empty: return df
     df_f = df.copy()
-    # 1. Precio (25%)
     df_f['diff_p'] = abs(df_f['precio'] - p_ref) / p_ref
     score_p = np.maximum(0, 1 - df_f['diff_p'])
-    # 2. Área (20%)
     df_f['diff_a'] = df_f['area'].apply(lambda x: abs(x - a_ref)/a_ref if x > 0 else 1.0)
     score_a = np.maximum(0, 1 - df_f['diff_a'])
-    # 3. Habitaciones (10%)
     score_h = df_f['habs'].apply(lambda x: 1.0 if x == h_ref else (0.9 if x==0 else (0.5 if abs(x-h_ref)<=1 else 0)))
-    # 4. Baños (10%)
     score_b = df_f['banos'].apply(lambda x: 1.0 if x == b_ref else (0.9 if x==0 else (0.6 if abs(x-b_ref)<=1 else 0.2)))
-    # 5. Garajes (10%)
     score_g = df_f['garajes'].apply(lambda x: 1.0 if x >= g_ref else (0.5 if x < g_ref and x > 0 else 0.8 if x==0 else 0))
-    # 6. Estrato (10%)
     score_e = df_f['estrato'].apply(lambda x: 1.0 if x == e_ref else (0.9 if x==0 else (0.5 if abs(x-e_ref)<=1 else 0)))
-    # 7. Antigüedad (10%)
     def calc_edad(x, ref):
         if x == -1: return 0.8
         if ref == 0: return 1.0 if x == 0 else max(0, 1 - (x/20))
         return max(0, 1 - (abs(x - ref) / 20))
     score_ant = df_f['antiguedad'].apply(lambda x: calc_edad(x, antiguedad_ref))
-    # 8. Condominio (5%)
     def calc_condo(x, quiere_condo):
         if not quiere_condo: return 1.0
         return 1.0 if x == 1 else 0.2
@@ -284,13 +253,8 @@ def motor(zona, tipo, precio, area, habs, banos, garajes, estrato, antiguedad, e
             margin-bottom: 12px;
             box-shadow: 0 2px 4px rgba(0,0,0,0.05);
         }
-        .btn-direct {
-            color: #2563eb !important; /* Azul */
-        }
-        .btn-list {
-            color: #d97706 !important; /* Naranja */
-            font-style: italic;
-        }
         .map-btn {
             background-color: #ea4335 !important;
             color: white !important;
@@ -300,6 +264,15 @@ def motor(zona, tipo, precio, area, habs, banos, garajes, estrato, antiguedad, e
             display: inline-block;
             margin-top: 5px;
         }
     </style>
     <div class="result-container">
     """
@@ -313,35 +286,23 @@ def motor(zona, tipo, precio, area, habs, banos, garajes, estrato, antiguedad, e
     if df is None:
         origen = "🌐 Google API"
         lista = buscar_google(q)
         if lista and "error" in lista[0]:
             return f"{css_injection}<h3 style='color:red !important;'>⚠️ Límite de Cuota Excedido.</h3></div>"
         if lista:
             guardar_cache(q, lista)
             df = pd.DataFrame(lista)
     if df is None or df.empty:
-        return f"{css_injection}<h3>❌ No se encontraron datos.</h3><p>Google no devolvió ningún resultado con precio/área legible.</p></div>"
     df_similares = calcular_scores(df, precio, area, habs, banos, garajes, estrato, antiguedad, es_condominio)
-    # CÁLCULO PROMEDIOS BLINDADO
-    # Filtro: Score decente, área > 10, precio > 1 Millón
-    df_calc = df_similares[
-        (df_similares['score'] >= 40) &
-        (df_similares['area'] > 10) &
-        (df_similares['precio'] > 1000000)
-    ]
-    if df_calc.empty and not df_similares.empty:
-        df_calc = df_similares # Si filtro estricto falla, usar todo lo disponible
     prom_precio = df_calc['precio'].mean() if not df_calc.empty else 0
     if not df_calc.empty:
-        # Calcular precio por metro cuadrado individualmente y luego promediar
-        # Esto evita errores de sumar áreas dispares
         df_calc['m2_individual'] = df_calc['precio'] / df_calc['area']
         prom_m2 = df_calc['m2_individual'].mean()
     else:
@@ -367,11 +328,17 @@ def motor(zona, tipo, precio, area, habs, banos, garajes, estrato, antiguedad, e
         txt_area = f"{row['area']} m²" if row['area'] > 0 else "N/A"
-        # Botones
-        btn_mapa = ""
         if row['lat'] and row['lon']:
             gmaps_link = f"https://www.google.com/maps/search/?api=1&query={row['lat']},{row['lon']}"
-            btn_mapa = f"<a href='{gmaps_link}' target='_blank' class='map-btn white-text'>📍 Ver en Mapa</a>"
         if row['es_directo'] == 1:
             btn_link = f"<a href='{row['url']}' target='_blank' class='btn-direct'>🔗 Ver Inmueble</a>"
@@ -423,8 +390,7 @@ def motor(zona, tipo, precio, area, habs, banos, garajes, estrato, antiguedad, e
 iniciar_db()
 with gr.Blocks(theme=gr.themes.Base()) as demo:
-    gr.Markdown("# 🏢 Valuador Híbrido V13")
-    gr.Markdown("Muestra inmuebles específicos y listados de referencia si no hay directos.")
     with gr.Row():
         with gr.Column(scale=2):

 import os
 import numpy as np
 from datetime import datetime, timedelta
+from urllib.parse import urlparse, urlunparse, quote
 # --- 1. CONFIGURACIÓN ---
 API_KEY = os.getenv("GOOGLE_API_KEY")
 SEARCH_ENGINE_ID = os.getenv("SEARCH_ENGINE_ID")
+DB_NAME = "data_cache_v14.db"
 # --- 2. GESTIÓN DE BASE DE DATOS ---
 def iniciar_db():
 # --- 3. EXTRACCIÓN Y VALIDACIÓN ---
 def analizar_tipo_url(url):
     """Classify a result URL: 1 for a single-property page, 0 otherwise.

     The lowercased URL is scanned for substrings typical of a detail
     page; the first hit yields 1. URLs carrying listing/search markers
     and URLs matching neither group both yield 0.
     """
     enlace = url.lower()

     # Detail-page markers are checked first, so they win over listing markers.
     marcas_detalle = (
         '/inmueble/', '/proyecto/', '/propiedad/', 'detalle',
         'p-', 'id-', 'cod-', 'mco-', 'mla-',
     )
     for marca in marcas_detalle:
         if marca in enlace:
             return 1

     marcas_listado = (
         'listado', 'resultados', 'buscar', 'search',
         'ordenar', 'filtrar', 'page',
     )
     for marca in marcas_listado:
         if marca in enlace:
             return 0

     # Neutral URLs get the same value as listings.
     return 0
 def limpiar_url(url):
     try:
         parsed = urlparse(url)
         clean = urlunparse((parsed.scheme, parsed.netloc, parsed.path, '', '', ''))
         return clean
     except:
 def parsear_texto_completo(texto):
     texto = texto.lower()
     precio = 0
     match_precio = re.search(r'\$\s?([\d.,]+)', texto)
     if match_precio:
         try: precio = float(s)
         except: pass
     area = 0
     match_area = re.search(r'(\d+[\.,]?\d*)\s?(m2|mt|mts|metro)', texto)
     if match_area:
         try: area = float(s_area)
         except: pass
     habs = 0
     match_habs = re.search(r'(\d+)\s?(hab|alcoba|dormitorio)', texto)
     if match_habs:
         try: habs = int(match_habs.group(1))
         except: pass
     banos = 0
     match_banos = re.search(r'(\d+)\s?(baño|bano)', texto)
     if match_banos:
         try: banos = int(match_banos.group(1))
         except: pass
     garajes = 0
     match_garaje = re.search(r'(\d+)\s?(parqueadero|garaje)', texto)
     if match_garaje:
     elif "garaje" in texto or "parqueadero" in texto:
         garajes = 1
     estrato = 0
     match_estrato = re.search(r'estrato\s?:?\s?(\d)', texto)
     if match_estrato:
         try: estrato = int(match_estrato.group(1))
         except: pass
     antiguedad = -1
     if "estrenar" in texto or "nuevo" in texto or "sobre planos" in texto:
         antiguedad = 0
             try: antiguedad = int(match_anos.group(1))
             except: pass
     seguridad = 0
     if any(k in texto for k in ['conjunto', 'vigilancia', 'porteria', 'seguridad', 'club house', 'cerrado']):
         seguridad = 1
     if not API_KEY or not SEARCH_ENGINE_ID: return []
     url = "https://www.googleapis.com/customsearch/v1"
     query_optimizada = f"{query} detalle"
     query_optimizada = query_optimizada.replace(",", " OR ")
         if 'items' in data:
             for item in data['items']:
                 raw_link = item.get('link', '')
                 es_directo = analizar_tipo_url(raw_link)
                 final_link = limpiar_url(raw_link)
                 texto = f"{item.get('title')} {item.get('snippet')}"
                 elif "metrocuadrado" in raw_link: fuente = "Metrocuadrado"
                 elif "wasi" in raw_link: fuente = "Wasi"
                 if precio > 0 or area > 0:
                     resultados.append({
                         'titulo': item.get('title'),
     if df.empty: return df
     df_f = df.copy()
+    # Precios y Áreas
     df_f['diff_p'] = abs(df_f['precio'] - p_ref) / p_ref
     score_p = np.maximum(0, 1 - df_f['diff_p'])
     df_f['diff_a'] = df_f['area'].apply(lambda x: abs(x - a_ref)/a_ref if x > 0 else 1.0)
     score_a = np.maximum(0, 1 - df_f['diff_a'])
+    # Habitaciones/Baños
     score_h = df_f['habs'].apply(lambda x: 1.0 if x == h_ref else (0.9 if x==0 else (0.5 if abs(x-h_ref)<=1 else 0)))
     score_b = df_f['banos'].apply(lambda x: 1.0 if x == b_ref else (0.9 if x==0 else (0.6 if abs(x-b_ref)<=1 else 0.2)))
+    # Garajes/Estrato
     score_g = df_f['garajes'].apply(lambda x: 1.0 if x >= g_ref else (0.5 if x < g_ref and x > 0 else 0.8 if x==0 else 0))
     score_e = df_f['estrato'].apply(lambda x: 1.0 if x == e_ref else (0.9 if x==0 else (0.5 if abs(x-e_ref)<=1 else 0)))
+    # Antigüedad/Condominio
     def calc_edad(x, ref):
         """Score how close a listing's age ``x`` is to the reference age ``ref``.

         Returns 0.8 when ``x`` is -1, 1.0 when both values are 0, and
         otherwise 1 minus one twentieth of the age gap, floored at 0.
         """
         if x == -1:
             return 0.8
         if ref == 0 and x == 0:
             return 1.0
         # With a zero reference the raw age is the gap (no abs() applied).
         desfase = x if ref == 0 else abs(x - ref)
         return max(0, 1 - (desfase / 20))
     score_ant = df_f['antiguedad'].apply(lambda x: calc_edad(x, antiguedad_ref))
     def calc_condo(x, quiere_condo):
         """Score the gated-community flag ``x`` against the user's preference.

         Returns 0.2 only when ``quiere_condo`` is truthy and ``x`` is not 1;
         every other combination returns 1.0.
         """
         return 0.2 if quiere_condo and x != 1 else 1.0
             margin-bottom: 12px;
             box-shadow: 0 2px 4px rgba(0,0,0,0.05);
         }
+        .btn-direct { color: #2563eb !important; }
+        .btn-list { color: #d97706 !important; font-style: italic; }
         .map-btn {
             background-color: #ea4335 !important;
             color: white !important;
             display: inline-block;
             margin-top: 5px;
         }
+        .map-btn-gray {
+            background-color: #5f6368 !important;
+            color: white !important;
+            padding: 4px 10px;
+            border-radius: 15px;
+            font-size: 0.8em;
+            display: inline-block;
+            margin-top: 5px;
+        }
     </style>
     <div class="result-container">
     """
     if df is None:
         origen = "🌐 Google API"
         lista = buscar_google(q)
         if lista and "error" in lista[0]:
             return f"{css_injection}<h3 style='color:red !important;'>⚠️ Límite de Cuota Excedido.</h3></div>"
         if lista:
             guardar_cache(q, lista)
             df = pd.DataFrame(lista)
     if df is None or df.empty:
+        return f"{css_injection}<h3>❌ No se encontraron datos válidos.</h3></div>"
     df_similares = calcular_scores(df, precio, area, habs, banos, garajes, estrato, antiguedad, es_condominio)
+    # Matemáticas Blindadas
+    df_calc = df_similares[(df_similares['score'] >= 40) & (df_similares['area'] > 10) & (df_similares['precio'] > 1000000)]
+    if df_calc.empty: df_calc = df_similares[df_similares['area'] > 10]
     prom_precio = df_calc['precio'].mean() if not df_calc.empty else 0
     if not df_calc.empty:
         df_calc['m2_individual'] = df_calc['precio'] / df_calc['area']
         prom_m2 = df_calc['m2_individual'].mean()
     else:
         txt_area = f"{row['area']} m²" if row['area'] > 0 else "N/A"
+        # --- LÓGICA DE MAPA INTELIGENTE ---
         if row['lat'] and row['lon']:
+            # Coordenadas exactas encontradas
             gmaps_link = f"https://www.google.com/maps/search/?api=1&query={row['lat']},{row['lon']}"
+            btn_mapa = f"<a href='{gmaps_link}' target='_blank' class='map-btn white-text'>📍 Ver Ubicación Exacta</a>"
+        else:
+            # Búsqueda Inversa por Título (Fallback)
+            titulo_safe = quote(f"{row['titulo']} {zona}")
+            gmaps_link = f"https://www.google.com/maps/search/?api=1&query={titulo_safe}"
+            btn_mapa = f"<a href='{gmaps_link}' target='_blank' class='map-btn-gray white-text'>📍 Buscar en Mapa</a>"
+        # ----------------------------------
         if row['es_directo'] == 1:
             btn_link = f"<a href='{row['url']}' target='_blank' class='btn-direct'>🔗 Ver Inmueble</a>"
 iniciar_db()
 with gr.Blocks(theme=gr.themes.Base()) as demo:
+    gr.Markdown("# 🏢 Valuador Inteligente V14 (Mapa Activo)")
     with gr.Row():
         with gr.Column(scale=2):