Final_Assignment_Agents

Sleeping

App Files Community

ernani committed on Apr 28, 2025

Commit

fb72cf5

1 Parent(s): 5e9938c

Removed chromadb from tools

Browse files

Files changed (1) hide show

tools.py +0 -75

tools.py CHANGED Viewed

@@ -8,8 +8,6 @@ from langchain.text_splitter import RecursiveCharacterTextSplitter
 from langchain_community.tools import WikipediaQueryRun, DuckDuckGoSearchRun
 from langchain_community.document_loaders import PythonLoader
 from langchain_community.utilities import WikipediaAPIWrapper
-import chromadb
-from chromadb.config import Settings
 import pytube
 from PIL import Image
 import pandas as pd
@@ -709,76 +707,3 @@ class WebSearchTool(BaseTool):
         except Exception as e:
             return f"Error searching the web: {str(e)}"
-class ChromaDBManager:
-    """Manager for ChromaDB operations"""
-    def __init__(self, persist_directory: str = "./chroma_db"):
-        self.persist_directory = persist_directory
-        self.client = chromadb.Client(Settings(
-            persist_directory=persist_directory,
-            is_persistent=True
-        ))
-    def create_collection(self, name: str):
-        """Create a new collection or get existing one"""
-        try:
-            return self.client.create_collection(name=name)
-        except ValueError:
-            return self.client.get_collection(name=name)
-    def _generate_document_id(self, content: str, metadata: dict) -> str:
-        """Generate a unique ID for a document based on its content and metadata"""
-        # Use content and key metadata fields for ID generation
-        id_parts = [content[:100]]  # First 100 chars of content
-        if metadata:
-            source = metadata.get('source', '')
-            doc_type = metadata.get('type', '')
-            if source:
-                id_parts.append(str(source))
-            if doc_type:
-                id_parts.append(str(doc_type))
-        # Generate hash from combined parts
-        combined = "_".join(id_parts)
-        return f"doc_{hash(combined)}"
-    def add_documents_with_metadata(self, collection_name: str, documents: List[str], metadatas: List[dict]):
-        """Add documents with their metadata to a collection"""
-        if not documents or not metadatas or len(documents) != len(metadatas):
-            raise ValueError("Invalid documents or metadata")
-        collection = self.create_collection(collection_name)
-        # Generate unique IDs for documents
-        ids = [self._generate_document_id(doc, meta)
-               for doc, meta in zip(documents, metadatas)]
-        try:
-            # First try to add documents
-            collection.add(
-                documents=documents,
-                metadatas=metadatas,
-                ids=ids
-            )
-        except Exception as e:
-            # If documents exist, update them
-            logging.info(f"Updating existing documents in collection {collection_name}")
-            collection.upsert(
-                documents=documents,
-                metadatas=metadatas,
-                ids=ids
-            )
-    def query_collection(self, collection_name: str, query: str, n_results: int = 5) -> Dict:
-        """Query a collection with improved retrieval"""
-        try:
-            collection = self.client.get_collection(collection_name)
-            results = collection.query(
-                query_texts=[query],
-                n_results=n_results
-            )
-            return results
-        except Exception as e:
-            logging.error(f"Error querying collection {collection_name}: {str(e)}")
-            return {"documents": [], "metadatas": [], "distances": []}

 from langchain_community.tools import WikipediaQueryRun, DuckDuckGoSearchRun
 from langchain_community.document_loaders import PythonLoader
 from langchain_community.utilities import WikipediaAPIWrapper
 import pytube
 from PIL import Image
 import pandas as pd
         except Exception as e:
             return f"Error searching the web: {str(e)}"