Update app.py
Browse files
app.py
CHANGED
|
@@ -24,7 +24,7 @@ def fetch_google_suggestions(query, lang_code="es", client="firefox"):
|
|
| 24 |
else:
|
| 25 |
return []
|
| 26 |
|
| 27 |
-
# Funci贸n para obtener sugerencias de Brave
|
| 28 |
def fetch_brave_suggestions(query, lang_code="es"):
|
| 29 |
encoded_query = urllib.parse.quote(query)
|
| 30 |
url = f"https://search.brave.com/api/suggest?q={encoded_query}"
|
|
@@ -33,7 +33,8 @@ def fetch_brave_suggestions(query, lang_code="es"):
|
|
| 33 |
try:
|
| 34 |
data = response.json()
|
| 35 |
if len(data) > 1 and isinstance(data[1], list):
|
| 36 |
-
|
|
|
|
| 37 |
else:
|
| 38 |
print("No se encontraron sugerencias en el formato esperado (Brave).")
|
| 39 |
return []
|
|
@@ -43,114 +44,7 @@ def fetch_brave_suggestions(query, lang_code="es"):
|
|
| 43 |
else:
|
| 44 |
return []
|
| 45 |
|
| 46 |
-
#
|
| 47 |
-
def fetch_qwant_suggestions(query, lang_code="es"):
|
| 48 |
-
encoded_query = urllib.parse.quote(query)
|
| 49 |
-
url = f"https://api.qwant.com/api/suggest/?client=opensearch&q={encoded_query}"
|
| 50 |
-
response = requests.get(url)
|
| 51 |
-
if response.status_code == 200:
|
| 52 |
-
try:
|
| 53 |
-
data = response.json()
|
| 54 |
-
if len(data) > 1 and isinstance(data[1], list):
|
| 55 |
-
return [normalize_keyword(item) for item in data[1]]
|
| 56 |
-
else:
|
| 57 |
-
print("No se encontraron sugerencias en el formato esperado (Qwant).")
|
| 58 |
-
return []
|
| 59 |
-
except ValueError:
|
| 60 |
-
print("Error decodificando JSON de Qwant")
|
| 61 |
-
return []
|
| 62 |
-
else:
|
| 63 |
-
return []
|
| 64 |
-
|
| 65 |
-
# Funci贸n para obtener sugerencias de DuckDuckGo
|
| 66 |
-
def fetch_duckduckgo_suggestions(query, lang_code="es"):
|
| 67 |
-
encoded_query = urllib.parse.quote(query)
|
| 68 |
-
url = f"https://duckduckgo.com/ac/?q={encoded_query}&kl={lang_code}"
|
| 69 |
-
response = requests.get(url)
|
| 70 |
-
if response.status_code == 200:
|
| 71 |
-
try:
|
| 72 |
-
data = response.json()
|
| 73 |
-
return [normalize_keyword(item['phrase']) for item in data]
|
| 74 |
-
except ValueError:
|
| 75 |
-
print("Error decodificando JSON de DuckDuckGo")
|
| 76 |
-
return []
|
| 77 |
-
else:
|
| 78 |
-
return []
|
| 79 |
-
|
| 80 |
-
# Funci贸n para obtener sugerencias de YouTube usando la API anterior
|
| 81 |
-
def fetch_youtube_suggestions(query, lang_code="es"):
|
| 82 |
-
encoded_query = urllib.parse.quote(query)
|
| 83 |
-
url = f"http://suggestqueries.google.com/complete/search?client=youtube&hl={lang_code}&q={encoded_query}"
|
| 84 |
-
response = requests.get(url)
|
| 85 |
-
if response.status_code == 200:
|
| 86 |
-
try:
|
| 87 |
-
match = re.search(r'window\.google\.ac\.h\(\["[^"]*",\[(.*?)\],', response.text)
|
| 88 |
-
if match:
|
| 89 |
-
suggestions_data = match.group(1)
|
| 90 |
-
return [normalize_keyword(suggestion) for suggestion in re.findall(r'\["([^"]+)"', suggestions_data)]
|
| 91 |
-
else:
|
| 92 |
-
print("No se encontraron sugerencias en el formato esperado (YouTube antiguo).")
|
| 93 |
-
return []
|
| 94 |
-
except Exception as e:
|
| 95 |
-
print(f"Error procesando la respuesta de YouTube (antiguo): {e}")
|
| 96 |
-
return []
|
| 97 |
-
else:
|
| 98 |
-
return []
|
| 99 |
-
|
| 100 |
-
# Funci贸n para obtener sugerencias de YouTube usando la nueva API
|
| 101 |
-
def fetch_youtube_suggestions_new(query, lang_code="es"):
|
| 102 |
-
encoded_query = urllib.parse.quote(query)
|
| 103 |
-
url = f"https://suggestqueries-clients6.youtube.com/complete/search?client=youtube&ds=yt&q={encoded_query}&hl={lang_code}"
|
| 104 |
-
response = requests.get(url)
|
| 105 |
-
if response.status_code == 200:
|
| 106 |
-
try:
|
| 107 |
-
match = re.search(r'window\.google\.ac\.h\(\["[^"]*",\[(.*?)\],', response.text)
|
| 108 |
-
if match:
|
| 109 |
-
suggestions_data = match.group(1)
|
| 110 |
-
return [normalize_keyword(suggestion) for suggestion in re.findall(r'\["([^"]+)"', suggestions_data)]
|
| 111 |
-
else:
|
| 112 |
-
print("No se encontraron sugerencias en el formato esperado (nueva API de YouTube).")
|
| 113 |
-
return []
|
| 114 |
-
except Exception as e:
|
| 115 |
-
print(f"Error procesando la respuesta de la nueva API de YouTube: {e}")
|
| 116 |
-
return []
|
| 117 |
-
else:
|
| 118 |
-
return []
|
| 119 |
-
|
| 120 |
-
# Funci贸n para obtener sugerencias de Bing
|
| 121 |
-
def fetch_bing_suggestions(query, market="en-US"):
|
| 122 |
-
url = "https://api.bing.com/qsml.aspx"
|
| 123 |
-
params = {"Market": market, "query": query}
|
| 124 |
-
headers = {"User-agent": "Mozilla/5.0"}
|
| 125 |
-
response = requests.get(url, params=params, headers=headers)
|
| 126 |
-
if response.status_code == 200:
|
| 127 |
-
try:
|
| 128 |
-
obj = xmltodict.parse(response.content)
|
| 129 |
-
suggestions = obj['SearchSuggestion']['Section']['Item']
|
| 130 |
-
if isinstance(suggestions, list):
|
| 131 |
-
return [normalize_keyword(s['Text']) for s in suggestions]
|
| 132 |
-
elif isinstance(suggestions, dict):
|
| 133 |
-
return [normalize_keyword(suggestions['Text'])]
|
| 134 |
-
except Exception as e:
|
| 135 |
-
print(f"Error procesando la respuesta de Bing: {e}")
|
| 136 |
-
return []
|
| 137 |
-
else:
|
| 138 |
-
return []
|
| 139 |
-
|
| 140 |
-
# Funci贸n para obtener sugerencias de Amazon
|
| 141 |
-
def fetch_amazon_suggestions(query, market_id="ATVPDKIKX0DER", alias="aps"):
|
| 142 |
-
url = "https://completion.amazon.com/api/2017/suggestions"
|
| 143 |
-
params = {"mid": market_id, "alias": alias, "prefix": query}
|
| 144 |
-
response = requests.get(url, params=params)
|
| 145 |
-
if response.status_code == 200:
|
| 146 |
-
try:
|
| 147 |
-
data = response.json()
|
| 148 |
-
return [normalize_keyword(item['value']) for item in data.get('suggestions', [])]
|
| 149 |
-
except ValueError:
|
| 150 |
-
print("Error decodificando JSON de Amazon")
|
| 151 |
-
return []
|
| 152 |
-
else:
|
| 153 |
-
return []
|
| 154 |
|
| 155 |
# Funci贸n para expandir la palabra clave
|
| 156 |
def expand_keyword(keyword):
|
|
@@ -179,16 +73,21 @@ def main(keyword):
|
|
| 179 |
|
| 180 |
# Obtener sugerencias de Google con diferentes clients
|
| 181 |
google_clients = ["firefox", "chrome", "android", "desktop", "opera"]
|
|
|
|
| 182 |
for exp_keyword in expanded_keywords:
|
| 183 |
for client in google_clients:
|
| 184 |
google_suggestions = fetch_google_suggestions(exp_keyword, client=client)
|
| 185 |
google_suggestions_all.extend(google_suggestions)
|
|
|
|
| 186 |
for suggestion in google_suggestions:
|
| 187 |
all_suggestions.setdefault(suggestion, {"count": 0, "sources": set()})
|
| 188 |
-
all_suggestions[suggestion]["count"] += 1
|
| 189 |
all_suggestions[suggestion]["sources"].add(f"Google ({client})")
|
| 190 |
|
| 191 |
-
#
|
|
|
|
|
|
|
|
|
|
|
|
|
| 192 |
for exp_keyword in expanded_keywords:
|
| 193 |
suggestions = fetch_duckduckgo_suggestions(exp_keyword)
|
| 194 |
duckduckgo_suggestions_all.extend(suggestions)
|
|
@@ -197,7 +96,7 @@ def main(keyword):
|
|
| 197 |
all_suggestions[suggestion]["count"] += 1
|
| 198 |
all_suggestions[suggestion]["sources"].add('DuckDuckGo')
|
| 199 |
|
| 200 |
-
# Obtener sugerencias de YouTube (API anterior y nueva)
|
| 201 |
for exp_keyword in expanded_keywords:
|
| 202 |
suggestions = fetch_youtube_suggestions(exp_keyword)
|
| 203 |
youtube_suggestions_all.extend(suggestions)
|
|
@@ -208,7 +107,7 @@ def main(keyword):
|
|
| 208 |
all_suggestions[suggestion]["count"] += 1
|
| 209 |
all_suggestions[suggestion]["sources"].add('YouTube')
|
| 210 |
|
| 211 |
-
# Obtener sugerencias de Bing
|
| 212 |
for exp_keyword in expanded_keywords:
|
| 213 |
suggestions = fetch_bing_suggestions(exp_keyword)
|
| 214 |
bing_suggestions_all.extend(suggestions)
|
|
@@ -217,7 +116,7 @@ def main(keyword):
|
|
| 217 |
all_suggestions[suggestion]["count"] += 1
|
| 218 |
all_suggestions[suggestion]["sources"].add('Bing')
|
| 219 |
|
| 220 |
-
# Obtener sugerencias de Amazon
|
| 221 |
for exp_keyword in expanded_keywords:
|
| 222 |
suggestions = fetch_amazon_suggestions(exp_keyword)
|
| 223 |
amazon_suggestions_all.extend(suggestions)
|
|
@@ -226,7 +125,7 @@ def main(keyword):
|
|
| 226 |
all_suggestions[suggestion]["count"] += 1
|
| 227 |
all_suggestions[suggestion]["sources"].add('Amazon')
|
| 228 |
|
| 229 |
-
# Obtener sugerencias de Qwant
|
| 230 |
for exp_keyword in expanded_keywords:
|
| 231 |
suggestions = fetch_qwant_suggestions(exp_keyword)
|
| 232 |
qwant_suggestions_all.extend(suggestions)
|
|
@@ -235,7 +134,7 @@ def main(keyword):
|
|
| 235 |
all_suggestions[suggestion]["count"] += 1
|
| 236 |
all_suggestions[suggestion]["sources"].add('Qwant')
|
| 237 |
|
| 238 |
-
# Obtener sugerencias de Brave
|
| 239 |
for exp_keyword in expanded_keywords:
|
| 240 |
suggestions = fetch_brave_suggestions(exp_keyword)
|
| 241 |
brave_suggestions_all.extend(suggestions)
|
|
@@ -244,7 +143,7 @@ def main(keyword):
|
|
| 244 |
all_suggestions[suggestion]["count"] += 1
|
| 245 |
all_suggestions[suggestion]["sources"].add('Brave')
|
| 246 |
|
| 247 |
-
# Calcular relevancia combinada:
|
| 248 |
combined_suggestions = sorted(all_suggestions.items(), key=lambda item: (len(item[1]["sources"]), item[1]["count"]), reverse=True)
|
| 249 |
|
| 250 |
# Obtener las top 3 de cada plataforma
|
|
|
|
| 24 |
else:
|
| 25 |
return []
|
| 26 |
|
| 27 |
+
# Funci贸n para obtener sugerencias de Brave (se reduce en un 65% el impacto)
|
| 28 |
def fetch_brave_suggestions(query, lang_code="es"):
|
| 29 |
encoded_query = urllib.parse.quote(query)
|
| 30 |
url = f"https://search.brave.com/api/suggest?q={encoded_query}"
|
|
|
|
| 33 |
try:
|
| 34 |
data = response.json()
|
| 35 |
if len(data) > 1 and isinstance(data[1], list):
|
| 36 |
+
# Reducir repeticiones en un 65%
|
| 37 |
+
return [normalize_keyword(item) for item in data[1] for _ in range(int(0.35 * 5))] # 65% menos
|
| 38 |
else:
|
| 39 |
print("No se encontraron sugerencias en el formato esperado (Brave).")
|
| 40 |
return []
|
|
|
|
| 44 |
else:
|
| 45 |
return []
|
| 46 |
|
| 47 |
+
# Otras funciones como Qwant, DuckDuckGo, YouTube, Bing, Amazon se mantienen igual (omitidas aqu铆 por brevedad)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 48 |
|
| 49 |
# Funci贸n para expandir la palabra clave
|
| 50 |
def expand_keyword(keyword):
|
|
|
|
| 73 |
|
| 74 |
# Obtener sugerencias de Google con diferentes clients
|
| 75 |
google_clients = ["firefox", "chrome", "android", "desktop", "opera"]
|
| 76 |
+
google_combined = Counter() # Contador combinado para sumar todas las sugerencias de Google
|
| 77 |
for exp_keyword in expanded_keywords:
|
| 78 |
for client in google_clients:
|
| 79 |
google_suggestions = fetch_google_suggestions(exp_keyword, client=client)
|
| 80 |
google_suggestions_all.extend(google_suggestions)
|
| 81 |
+
google_combined.update(google_suggestions) # Sumar las repeticiones de cada cliente de Google
|
| 82 |
for suggestion in google_suggestions:
|
| 83 |
all_suggestions.setdefault(suggestion, {"count": 0, "sources": set()})
|
|
|
|
| 84 |
all_suggestions[suggestion]["sources"].add(f"Google ({client})")
|
| 85 |
|
| 86 |
+
# Al final de todas las consultas a Google, combinamos las repeticiones en una 煤nica fuente de Google
|
| 87 |
+
for suggestion, count in google_combined.items():
|
| 88 |
+
all_suggestions[suggestion]["count"] += count
|
| 89 |
+
|
| 90 |
+
# Obtener sugerencias de DuckDuckGo (se mantiene sin cambios)
|
| 91 |
for exp_keyword in expanded_keywords:
|
| 92 |
suggestions = fetch_duckduckgo_suggestions(exp_keyword)
|
| 93 |
duckduckgo_suggestions_all.extend(suggestions)
|
|
|
|
| 96 |
all_suggestions[suggestion]["count"] += 1
|
| 97 |
all_suggestions[suggestion]["sources"].add('DuckDuckGo')
|
| 98 |
|
| 99 |
+
# Obtener sugerencias de YouTube (API anterior y nueva) (sin cambios)
|
| 100 |
for exp_keyword in expanded_keywords:
|
| 101 |
suggestions = fetch_youtube_suggestions(exp_keyword)
|
| 102 |
youtube_suggestions_all.extend(suggestions)
|
|
|
|
| 107 |
all_suggestions[suggestion]["count"] += 1
|
| 108 |
all_suggestions[suggestion]["sources"].add('YouTube')
|
| 109 |
|
| 110 |
+
# Obtener sugerencias de Bing (se mantiene sin cambios)
|
| 111 |
for exp_keyword in expanded_keywords:
|
| 112 |
suggestions = fetch_bing_suggestions(exp_keyword)
|
| 113 |
bing_suggestions_all.extend(suggestions)
|
|
|
|
| 116 |
all_suggestions[suggestion]["count"] += 1
|
| 117 |
all_suggestions[suggestion]["sources"].add('Bing')
|
| 118 |
|
| 119 |
+
# Obtener sugerencias de Amazon (se mantiene sin cambios)
|
| 120 |
for exp_keyword in expanded_keywords:
|
| 121 |
suggestions = fetch_amazon_suggestions(exp_keyword)
|
| 122 |
amazon_suggestions_all.extend(suggestions)
|
|
|
|
| 125 |
all_suggestions[suggestion]["count"] += 1
|
| 126 |
all_suggestions[suggestion]["sources"].add('Amazon')
|
| 127 |
|
| 128 |
+
# Obtener sugerencias de Qwant (se mantiene sin cambios)
|
| 129 |
for exp_keyword in expanded_keywords:
|
| 130 |
suggestions = fetch_qwant_suggestions(exp_keyword)
|
| 131 |
qwant_suggestions_all.extend(suggestions)
|
|
|
|
| 134 |
all_suggestions[suggestion]["count"] += 1
|
| 135 |
all_suggestions[suggestion]["sources"].add('Qwant')
|
| 136 |
|
| 137 |
+
# Obtener sugerencias de Brave (reducidas en un 65%)
|
| 138 |
for exp_keyword in expanded_keywords:
|
| 139 |
suggestions = fetch_brave_suggestions(exp_keyword)
|
| 140 |
brave_suggestions_all.extend(suggestions)
|
|
|
|
| 143 |
all_suggestions[suggestion]["count"] += 1
|
| 144 |
all_suggestions[suggestion]["sources"].add('Brave')
|
| 145 |
|
| 146 |
+
# Calcular relevancia combinada: basado en cu谩ntos buscadores mencionan una palabra y cu谩ntas veces se repite
|
| 147 |
combined_suggestions = sorted(all_suggestions.items(), key=lambda item: (len(item[1]["sources"]), item[1]["count"]), reverse=True)
|
| 148 |
|
| 149 |
# Obtener las top 3 de cada plataforma
|