reference_page_finder_api

Sleeping

Arafath10 committed on Aug 2, 2024

Commit

38f11d6

verified ·

1 Parent(s): 5722adc

Update main.py

Files changed (1) hide show

main.py CHANGED Viewed

@@ -20,6 +20,8 @@ app.add_middleware(
 @app.post("/get_n_depth_results")
 async def get_n_depth_results(url,input_query):
     all_content = {}
     def add_pdf_content(selected_pdf):
@@ -109,31 +111,33 @@ async def get_n_depth_results(url,input_query):
             futures = [executor.submit(scrapper, input_url) for input_url in (json.loads(input_url)[:2])]
             for future in concurrent.futures.as_completed(futures):
                 next_urls.append(separate_pdf_and_nonPDF_links(future.result()))
         selected_links_from_llm = call_llm_service(next_urls, input_url, input_query, "")
         input_url = selected_links_from_llm
         print(json.loads(input_url)[:2])
     if not pdf_urls:
         print(pdf_urls)
         #return all_content.keys()
         return all_content
     else:
-        selected_pdf = json.loads(call_llm_service(pdf_urls, input_url, input_query, "only end with .pdf extension"))
         print(pdf_urls)
-        print("selected pdf")
-        print(selected_pdf)
         #return all_content.keys()
         return all_content
-# # Start time
-# start_time = time.time()
-# print(main("https://www.keells.com/", "Please analyse reports"))
-# # End time
-# end_time = time.time()
-# # Calculate the time taken
-# time_taken = end_time - start_time
-# print(f"Time taken: {time_taken} seconds")

 @app.post("/get_n_depth_results")
 async def get_n_depth_results(url,input_query):
+    # Start time
+    start_time = time.time()
     all_content = {}
     def add_pdf_content(selected_pdf):
             futures = [executor.submit(scrapper, input_url) for input_url in (json.loads(input_url)[:2])]
             for future in concurrent.futures.as_completed(futures):
                 next_urls.append(separate_pdf_and_nonPDF_links(future.result()))
+        if step==2:
+            break
         selected_links_from_llm = call_llm_service(next_urls, input_url, input_query, "")
         input_url = selected_links_from_llm
         print(json.loads(input_url)[:2])
+    # End time
+    end_time = time.time()
+    # Calculate the time taken
+    time_taken = end_time - start_time
+    print(f"Time taken: {time_taken} seconds")
     if not pdf_urls:
         print(pdf_urls)
         #return all_content.keys()
         return all_content
     else:
+        #selected_pdf = json.loads(call_llm_service(pdf_urls, input_url, input_query, "only end with .pdf extension"))
         print(pdf_urls)
+        #print("selected pdf")
+        #print(selected_pdf)
         #return all_content.keys()
         return all_content
+#print(main("https://www.keells.com/", "Please analyse reports"))