Spaces:

BluescarfAI
/

Doc-Processing-Agent

Sleeping

App Files Files Community

dure-waseem committed on Jul 17, 2025

Commit

ae43d88

1 Parent(s): 91881f8

initial code

Browse files

Files changed (6) hide show

config/agents.yaml +8 -0
config/tasks.yaml +9 -0
crew.py +111 -0
main.py +247 -0
requirements.txt +2 -0
tools/custom_tool.py +91 -0

config/agents.yaml ADDED Viewed

	@@ -0,0 +1,8 @@

+document_analyst:
+  role: >
+    Senior Document Analyst
+  goal: >
+    To analyze the document
+  backstory: >
+    You have a keen eye for detail and are able to analyze documents with precision.
+    Your role is to analyze the document and extract the exact information from it.

config/tasks.yaml ADDED Viewed

	@@ -0,0 +1,9 @@

+document_analysis:
+  description: >
+    Analyze the document and extract the exact information from it. {file_path} is the path of the document.
+    {file_type} is the type of the document.
+  expected_output: >
+    The document is analyzed and the exact information is extracted from it.
+    Return in Markdown format.
+  agent: document_analyst

crew.py ADDED Viewed

	@@ -0,0 +1,111 @@

+# from crewai import Agent, Crew, Process, Task, LLM
+# from crewai.project import CrewBase, agent, crew, task
+# from tools.custom_tool import landing_ai_document_analysis
+# from dotenv import load_dotenv
+# import os
+# # from langchain_groq import ChatGroq
+# # Load environment variables
+# load_dotenv()
+# @CrewBase
+# class DocProcessing():
+# 	"""DocProcessing crew"""
+# 	agents_config = 'config/agents.yaml'
+# 	tasks_config = 'config/tasks.yaml'
+# 	llm = LLM(
+# 		model = "claude-3-haiku-20240307",
+# 		api_key = os.getenv("ANTHROPIC_API_KEY"),
+# 		temperature = 0,
+# 		)
+# 	# llm = ChatGroq(
+# 	# 	model = "groq/llama-3.1-8b-instant",
+# 	# 	api_key= os.getenv("GROQ_API_KEY"),
+# 	# )
+# 	@agent
+# 	def document_analyst(self) -> Agent:
+# 		return Agent(
+# 			config=self.agents_config['document_analyst'],
+# 			verbose=True,
+# 			tools=[landing_ai_document_analysis],
+# 			llm=self.llm,
+# 		)
+# 	@task
+# 	def document_analysis(self) -> Task:
+# 		return Task(
+# 			config=self.tasks_config['document_analysis'],
+# 		)
+# 	@crew
+# 	def crew(self) -> Crew:
+# 		"""Creates the DocProcessing crew"""
+# 		return Crew(
+# 			agents=self.agents, # Automatically created by the @agent decorator
+# 			tasks=self.tasks, # Automatically created by the @task decorator
+# 			process=Process.sequential,
+# 			verbose=True,
+# 		)
+from crewai import Agent, Crew, Process, Task, LLM
+from crewai.project import CrewBase, agent, crew, task
+from tools.custom_tool import landing_ai_document_analysis
+import os
+@CrewBase
+class DocProcessing():
+	"""DocProcessing crew for document analysis"""
+	agents_config = 'config/agents.yaml'
+	tasks_config = 'config/tasks.yaml'
+	def __init__(self):
+		"""Initialize the DocProcessing crew with API key validation."""
+		super().__init__()
+		# Get API key from environment variable (set at runtime)
+		anthropic_api_key = os.getenv("ANTHROPIC_API_KEY")
+		if not anthropic_api_key:
+			raise ValueError("ANTHROPIC_API_KEY environment variable is required")
+		self.llm = LLM(
+			model="claude-3-haiku-20240307",
+			api_key=anthropic_api_key,
+			temperature=0,
+		)
+	@agent
+	def document_analyst(self) -> Agent:
+		return Agent(
+			config=self.agents_config['document_analyst'],
+			verbose=True,
+			tools=[landing_ai_document_analysis],
+			llm=self.llm,
+		)
+	@task
+	def document_analysis(self) -> Task:
+		return Task(
+			config=self.tasks_config['document_analysis'],
+		)
+	@crew
+	def crew(self) -> Crew:
+		"""Creates the DocProcessing crew"""
+		return Crew(
+			agents=self.agents, # Automatically created by the @agent decorator
+			tasks=self.tasks, # Automatically created by the @task decorator
+			process=Process.sequential,
+			verbose=True,
+		)

main.py ADDED Viewed

	@@ -0,0 +1,247 @@

+# #!/usr/bin/env python
+# import sys
+# import os
+# import warnings
+# from crew import DocProcessing
+# warnings.filterwarnings("ignore", category=SyntaxWarning, module="pysbd")
+# def determine_file_type(file_path):
+#     """
+#     Determine the file type based on the file extension.
+#     Args:
+#         file_path (str): Path to the file
+#     Returns:
+#         str: 'pdf' if the file is a PDF, 'image' otherwise
+#     """
+#     _, ext = os.path.splitext(file_path)
+#     if ext.lower() == '.pdf':
+#         return 'pdf'
+#     return 'image'
+# def run():
+#     """
+#     Run the crew with file paths received from command line arguments.
+#     """
+#     # Get file paths from command line arguments
+#     file_paths = sys.argv[1:] if len(sys.argv) > 1 else []
+#     if not file_paths:
+#         print("No file paths provided. Usage: python main.py <file_path1> <file_path2> ...")
+#         return
+#     # Process the first file (you can modify this to handle multiple files if needed)
+#     file_path = file_paths[0]
+#     file_type = determine_file_type(file_path)
+#     print(f"Processing file: {file_path} (type: {file_type})")
+#     # Prepare inputs for the CrewAI
+#     inputs = {
+#         "file_path": file_path,
+#         "file_type": file_type,
+#     }
+#     try:
+#         # Pass the inputs to the crew kickoff method
+#         result = DocProcessing().crew().kickoff(inputs=inputs)
+#         return result
+#     except Exception as e:
+#         error_msg = f"An error occurred while running the crew: {e}"
+#         print(error_msg)
+#         raise Exception(error_msg)
+# if __name__ == "__main__":
+#     run()
+#!/usr/bin/env python
+import os
+import tempfile
+import gradio as gr
+import warnings
+from crew import DocProcessing
+warnings.filterwarnings("ignore", category=SyntaxWarning, module="pysbd")
+def determine_file_type(file_path):
+    """
+    Determine the file type based on the file extension.
+    Args:
+        file_path (str): Path to the file
+    Returns:
+        str: 'pdf' if the file is a PDF, 'image' otherwise
+    """
+    _, ext = os.path.splitext(file_path)
+    if ext.lower() == '.pdf':
+        return 'pdf'
+    return 'image'
+def process_document(file, anthropic_api_key, landing_ai_api_key):
+    """
+    Process the uploaded document using CrewAI.
+    Args:
+        file: Uploaded file from Gradio
+        anthropic_api_key (str): Anthropic API key
+        landing_ai_api_key (str): LandingAI API key
+    Returns:
+        str: Processing results or error message
+    """
+    try:
+        # Validate inputs
+        if file is None:
+            return "❌ Please upload a file first."
+        if not anthropic_api_key.strip():
+            return "❌ Please provide your Anthropic API key."
+        if not landing_ai_api_key.strip():
+            return "❌ Please provide your LandingAI API key."
+        # Set environment variables securely for this session
+        os.environ["ANTHROPIC_API_KEY"] = anthropic_api_key.strip()
+        os.environ["LANDING_AI_API_KEY"] = landing_ai_api_key.strip()
+        # Get file path and determine type
+        file_path = file.name
+        file_type = determine_file_type(file_path)
+        print(f"Processing file: {file_path} (type: {file_type})")
+        # Prepare inputs for CrewAI
+        inputs = {
+            "file_path": file_path,
+            "file_type": file_type,
+        }
+        # Process with CrewAI
+        result = DocProcessing().crew().kickoff(inputs=inputs)
+        # Clean up environment variables for security
+        if "ANTHROPIC_API_KEY" in os.environ:
+            del os.environ["ANTHROPIC_API_KEY"]
+        if "LANDING_AI_API_KEY" in os.environ:
+            del os.environ["LANDING_AI_API_KEY"]
+        return f"✅ **Processing Complete!**\n\n{result}"
+    except Exception as e:
+        # Clean up environment variables even on error
+        if "ANTHROPIC_API_KEY" in os.environ:
+            del os.environ["ANTHROPIC_API_KEY"]
+        if "LANDING_AI_API_KEY" in os.environ:
+            del os.environ["LANDING_AI_API_KEY"]
+        error_msg = f"❌ **Error occurred:** {str(e)}"
+        print(error_msg)
+        return error_msg
+# Create Gradio interface
+def create_interface():
+    """Create and return the Gradio interface."""
+    with gr.Blocks(
+        title="Document Analysis with CrewAI",
+        theme=gr.themes.Soft(),
+        css="""
+        .container {
+            max-width: 800px;
+            margin: auto;
+        }
+        .header {
+            text-align: center;
+            margin-bottom: 30px;
+        }
+        .api-section {
+            background-color: #f8f9fa;
+            padding: 20px;
+            border-radius: 10px;
+            margin-bottom: 20px;
+        }
+        """
+    ) as demo:
+        gr.HTML("""
+        <div class="header">
+            <h1>🤖 Document Analysis</h1>
+            <p>Upload your documents for intelligent analysis using AI agents</p>
+        </div>
+        """)
+        with gr.Row():
+            with gr.Column():
+                # API Keys Section
+                gr.HTML("<div class='api-section'>")
+                gr.Markdown("### 🔑 API Keys")
+                gr.Markdown("Enter your API keys below. They are used securely and not stored.")
+                anthropic_key = gr.Textbox(
+                    label="Anthropic API Key",
+                    placeholder="Enter your Anthropic API key...",
+                    type="password",
+                    info="Get your key from: https://console.anthropic.com/"
+                )
+                landing_ai_key = gr.Textbox(
+                    label="LandingAI API Key",
+                    placeholder="Enter your LandingAI API key...",
+                    type="password",
+                    info="Get your key from: https://landing.ai/"
+                )
+                gr.HTML("</div>")
+                # File Upload Section
+                gr.Markdown("### 📄 Upload Document")
+                file_input = gr.File(
+                    label="Select your document (.pdf, .png, .jpg, .jpeg, .bmp, .tiff)",
+                    file_types=[".pdf", ".png", ".jpg", ".jpeg", ".bmp", ".tiff"],
+                    file_count="single"
+                )
+                # Process Button
+                process_btn = gr.Button(
+                    "🚀 Analyze Document",
+                    variant="primary",
+                    size="lg"
+                )
+            with gr.Column():
+                # Results Section
+                gr.Markdown("### 📊 Analysis Results")
+                output = gr.Textbox(
+                    label="Results",
+                    placeholder="Upload a document and click 'Analyze Document' to see results here...",
+                    lines=20,
+                    max_lines=30,
+                    show_copy_button=True
+                )
+        # Examples section
+        # Set up the event handler
+        process_btn.click(
+            fn=process_document,
+            inputs=[file_input, anthropic_key, landing_ai_key],
+            outputs=output,
+            show_progress=True
+        )
+    return demo
+# Launch the application
+if __name__ == "__main__":
+    demo = create_interface()
+    demo.launch(
+        server_name="0.0.0.0",  # Important for HuggingFace deployment
+        server_port=7860,       # Default port for HuggingFace
+        share=False,
+        show_error=True
+    )

requirements.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ gradio
2	+ crewai

tools/custom_tool.py ADDED Viewed

	@@ -0,0 +1,91 @@

+# import os
+# import requests
+# from crewai.tools import tool
+# from dotenv import load_dotenv
+# # Load environment variables
+# load_dotenv()
+# @tool("LandingAI Document Analysis")
+# def landing_ai_document_analysis(file_path: str, file_type: str = "image") -> str:
+#     """
+#     Analyze images or PDFs using LandingAI's document analysis API.
+#     Args:
+#         file_path (str): Path to the image or PDF file to analyze
+#         file_type (str): Type of file, either "image" or "pdf"
+#     Returns:
+#         str: Analysis results from the API
+#     """
+#     # Get API key from environment variable
+#     api_key = os.getenv("LANDING_AI_API_KEY")
+#     # API endpoint
+#     url = "https://api.va.landing.ai/v1/tools/agentic-document-analysis"
+#     # Prepare the file for upload based on file_type
+#     with open(file_path, "rb") as file_obj:
+#         if file_type.lower() == "pdf":
+#             files = {"pdf": file_obj}
+#         else:
+#             files = {"image": file_obj}
+#         # Prepare headers with authentication
+#         headers = {"Authorization": f"Basic {api_key}"}
+#         # Make the API request
+#         response = requests.post(url, files=files, headers=headers)
+#     return response.json()
+import os
+import requests
+from crewai.tools import tool
+@tool("LandingAI Document Analysis")
+def landing_ai_document_analysis(file_path: str, file_type: str = "image") -> str:
+    """
+    Analyze images or PDFs using LandingAI's document analysis API.
+    Args:
+        file_path (str): Path to the image or PDF file to analyze
+        file_type (str): Type of file, either "image" or "pdf"
+    Returns:
+        str: Analysis results from the API
+    """
+    # Get API key from environment variable
+    api_key = os.getenv("LANDING_AI_API_KEY")
+    if not api_key:
+        return "Error: LANDING_AI_API_KEY environment variable is not set"
+    # API endpoint
+    url = "https://api.va.landing.ai/v1/tools/agentic-document-analysis"
+    try:
+        # Prepare the file for upload based on file_type
+        with open(file_path, "rb") as file_obj:
+            if file_type.lower() == "pdf":
+                files = {"pdf": file_obj}
+            else:
+                files = {"image": file_obj}
+            # Prepare headers with authentication
+            headers = {"Authorization": f"Basic {api_key}"}
+            # Make the API request
+            response = requests.post(url, files=files, headers=headers)
+            # Check if request was successful
+            if response.status_code == 200:
+                return response.json()
+            else:
+                return f"API Error: {response.status_code} - {response.text}"
+    except FileNotFoundError:
+        return f"Error: File not found at path: {file_path}"
+    except Exception as e:
+        return f"Error processing file: {str(e)}"