New_Final_Assignment

Sleeping

App Files Community

naman1102 committed on Jun 2, 2025

Commit

838224c

1 Parent(s): fa1d537

Update tools.py

Browse files

Files changed (1) hide show

tools.py +6 -5

tools.py CHANGED Viewed

@@ -22,10 +22,11 @@ def _download_file_for_task(task_id: str, ext: str) -> str:
     os.makedirs("hf_files", exist_ok=True)
     local_path = os.path.join("hf_files", f"{task_id}.{ext}")
     url = f"{DEFAULT_API_URL}/files/{task_id}"
-    print(f"Downloading file from {url} to {local_path}")
     try:
         resp = requests.get(url, timeout=10)
         if resp.status_code == 200 and resp.content:
             with open(local_path, "wb") as f:
                 f.write(resp.content)
             return local_path
@@ -56,7 +57,7 @@ def web_search_tool(state: AgentState) -> AgentState:
             break
         if attempt < max_retries - 1:
             print(f"web_search_result: rate limit error, retrying in 10 seconds")
-            time.sleep(3)
     print(f"web_search_result reached ")
     return {
         "web_search_query": None,
@@ -102,7 +103,7 @@ def ocr_image_tool(state: AgentState) -> AgentState:
         text = pytesseract.image_to_string(img).strip() or "(no visible text)"
     except Exception as e:
         text = f"Error during OCR: {e}"
     return {
         "ocr_path": None,
         "ocr_result": text
@@ -179,7 +180,7 @@ def parse_excel_tool(state: AgentState) -> AgentState:
     # 4) Strip out separator rows and return the table block
     clean_rows = [row for row in table_lines if not re.match(r"^\s*\|\s*-+", row)]
     table_block = "\n".join(clean_rows).strip()
     return {
         "excel_path": None,
         "excel_sheet_name": None,
@@ -258,7 +259,7 @@ def audio_transcriber_tool(state: AgentState) -> AgentState:
         text = response.get("text", "").strip()
     except Exception as e:
         text = f"Error during transcription: {e}"
     return {
         "audio_path": None,
         "transcript": text

     os.makedirs("hf_files", exist_ok=True)
     local_path = os.path.join("hf_files", f"{task_id}.{ext}")
     url = f"{DEFAULT_API_URL}/files/{task_id}"
     try:
         resp = requests.get(url, timeout=10)
         if resp.status_code == 200 and resp.content:
+            print(f"Downloaded file from {url} to {local_path}")
             with open(local_path, "wb") as f:
                 f.write(resp.content)
             return local_path
             break
         if attempt < max_retries - 1:
             print(f"web_search_result: rate limit error, retrying in 10 seconds")
+            time.sleep(4)
     print(f"web_search_result reached ")
     return {
         "web_search_query": None,
         text = pytesseract.image_to_string(img).strip() or "(no visible text)"
     except Exception as e:
         text = f"Error during OCR: {e}"
+    print(f"OCRed as ocr_result: {text}")
     return {
         "ocr_path": None,
         "ocr_result": text
     # 4) Strip out separator rows and return the table block
     clean_rows = [row for row in table_lines if not re.match(r"^\s*\|\s*-+", row)]
     table_block = "\n".join(clean_rows).strip()
+    print(f"Parsed excel as excel_result: {table_block}")
     return {
         "excel_path": None,
         "excel_sheet_name": None,
         text = response.get("text", "").strip()
     except Exception as e:
         text = f"Error during transcription: {e}"
+    print(f"Transcripted as transcript: {text}")
     return {
         "audio_path": None,
         "transcript": text