Spaces:

TharanJ
/

Insurance_Agent

Sleeping

App Files Community

TharanJ committed on Aug 10, 2025

Commit

e4c6be7

1 Parent(s): f9fa975

Prompt changes

Browse files

Files changed (1) hide show

llm.py +4 -25

llm.py CHANGED Viewed

@@ -31,20 +31,10 @@ def extract_https_links(chunks):
 def fetch_all_links(links, timeout=10, max_workers=10):
     """
     Fetch all HTTPS links in parallel, with per-link timing.
-    Skips banned links.
     Returns a dict {link: content or error}.
     """
     fetched_data = {}
-    banned_links = [
-        "https://register.hackrx.in/teams/public/flights/getFirstCityFlightNumber",
-        "https://register.hackrx.in/teams/public/flights/getSecondCityFlightNumber",
-        "https://register.hackrx.in/teams/public/flights/getFourthCityFlightNumber",
-        "https://register.hackrx.in/teams/public/flights/getFifthCityFlightNumber",
-    ]
-    special_url = "https://register.hackrx.in/submissions/myFavouriteCity"
     def fetch(link):
         start = time.perf_counter()
         try:
@@ -58,29 +48,18 @@ def fetch_all_links(links, timeout=10, max_workers=10):
             print(f"❌ {link} — {elapsed:.2f}s — ERROR: {e}")
             return link, f"ERROR: {e}"
-    # Filter banned links first
-    links_to_fetch = [l for l in links if l not in banned_links]
-    for banned in set(links) - set(links_to_fetch):
-        print(f"⛔ Skipped banned link: {banned}")
-        fetched_data[banned] = "BANNED"
-    # Fetch special_url first if present
-    if special_url in links_to_fetch:
-        link, content = fetch(special_url)
-        fetched_data[link] = content
-        links_to_fetch.remove(special_url)
-    # Fetch the rest in parallel
     t0 = time.perf_counter()
     with ThreadPoolExecutor(max_workers=max_workers) as executor:
-        future_to_link = {executor.submit(fetch, link): link for link in links_to_fetch}
         for future in as_completed(future_to_link):
             link, content = future.result()
             fetched_data[link] = content
-    print(f"[TIMER] Total link fetching: {time.perf_counter() - t0:.2f}s")
     return fetched_data
 def query_gemini(questions, contexts, max_retries=3):
     import itertools

 def fetch_all_links(links, timeout=10, max_workers=10):
     """
     Fetch all HTTPS links in parallel, with per-link timing.
     Returns a dict {link: content or error}.
     """
     fetched_data = {}
     def fetch(link):
         start = time.perf_counter()
         try:
             print(f"❌ {link} — {elapsed:.2f}s — ERROR: {e}")
             return link, f"ERROR: {e}"
+    # Fetch all links in parallel (no banned filtering, no special prioritization)
     t0 = time.perf_counter()
     with ThreadPoolExecutor(max_workers=max_workers) as executor:
+        future_to_link = {executor.submit(fetch, link): link for link in links}
         for future in as_completed(future_to_link):
             link, content = future.result()
             fetched_data[link] = content
+    print(f"[TIMER] Total link fetching: {time.perf_counter() - t0:.2f}s")
     return fetched_data
 def query_gemini(questions, contexts, max_retries=3):
     import itertools