Spaces:

Makima57
/

query

Sleeping

Makima57 committed on Sep 19, 2024

Commit

80b7575

verified ·

1 Parent(s): 47813a1

Upload app.py with huggingface_hub

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,28 +5,31 @@ from bs4 import BeautifulSoup
 import requests
 from urllib.parse import urljoin, urlparse
-def search(query, url):
-    if not url.startswith("http"):
-        url = "https://" + url
-    parsed_url = urlparse(url)
-    search_url = f"{parsed_url.scheme}://{parsed_url.netloc}/{query}/"
-    return search_url
 def download_content(url):
     response = requests.get(url)
     return response.text
 st.title("Search and Download")
 query = st.text_input("Enter your query (e.g. beds)")
 url = st.text_input("Enter the URL to search from (e.g. https://www.daraz.com.np/)")
-search_button = st.button("Search")
-if search_button:
-    link = search(query, url)
-    st.write(f"First result: {link}")
-    download_button = st.button("Download Content")
-    if download_button:
-        content = download_content(link)
-        st.download_button("Download", content, file_name="content.html")

 import requests
 from urllib.parse import urljoin, urlparse
+def google_search(query, url):
+    google_url = f"https://www.google.com/search?q={query}+site:{url}"
+    response = requests.get(google_url)
+    soup = BeautifulSoup(response.text, 'html.parser')
+    links = soup.find_all('a')
+    for link in links:
+        href = link.get('href')
+        if href and href.startswith('/url?q='):
+            return href.split('&sa=U&ved=')[0].replace('/url?q=', '')
+    return None
 def download_content(url):
     """Fetch *url* over HTTP and return the decoded response body as text.
 
     Raises:
         requests.HTTPError: if the server answers with a 4xx/5xx status, so
             an error page is never handed back as the downloaded content.
         requests.Timeout: if connecting or waiting for data exceeds the
             10-second timeout.
     """
     # Without a timeout requests waits indefinitely on an unresponsive host.
     response = requests.get(url, timeout=10)
     response.raise_for_status()
     return response.text
 st.title("Search and Download")
 query = st.text_input("Enter your query (e.g. beds)")
 url = st.text_input("Enter the URL to search from (e.g. https://www.daraz.com.np/)")
+if st.button("Search"):
+    link = google_search(query, url)
+    if link:
+        st.write("First result:", link)
+        if st.button("Download content"):
+            content = download_content(link)
+            st.download_button("Download", content, file_name="content.html")
+    else:
+        st.write("No results found")