Spaces:
Sleeping
Sleeping
Update requirements.txt
Browse files
- requirements.txt +46 -24
requirements.txt
CHANGED
|
@@ -1,25 +1,47 @@
|
|
| 1 |
-
# Core Dependencies
|
| 2 |
-
chromadb>=0.4.0 # For vector database functionality
|
| 3 |
-
mistralai>=0.1.1 # For Mistral AI API integration
|
| 4 |
-
langchain>=0.1.0 # For text splitting and utilities
|
| 5 |
-
streamlit>=1.30.0 # For the web app interface
|
| 6 |
-
|
| 7 |
-
# File Processing Dependencies
|
| 8 |
-
|
| 9 |
-
|
| 10 |
-
|
| 11 |
-
|
| 12 |
-
|
| 13 |
-
#
|
| 14 |
-
|
| 15 |
-
|
| 16 |
-
|
| 17 |
-
|
| 18 |
-
|
| 19 |
-
|
| 20 |
-
|
| 21 |
-
|
| 22 |
-
|
| 23 |
-
|
| 24 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 25 |
pandas>=2.0.0 # For spreadsheet processing
|
|
|
|
| 1 |
+
# Core Dependencies
|
| 2 |
+
chromadb>=0.4.0 # For vector database functionality
|
| 3 |
+
mistralai>=0.1.1 # For Mistral AI API integration
|
| 4 |
+
langchain>=0.1.0 # For text splitting and utilities
|
| 5 |
+
streamlit>=1.30.0 # For the web app interface
|
| 6 |
+
|
| 7 |
+
# File Processing Dependencies
# Core Dependencies
|
| 8 |
+
chromadb>=0.4.0
|
| 9 |
+
mistralai>=0.5.0 # New Mistral client
|
| 10 |
+
langchain>=0.1.0
|
| 11 |
+
streamlit>=1.30.0
|
| 12 |
+
|
| 13 |
+
# File Processing Dependencies
|
| 14 |
+
pymupdf>=1.23.0
|
| 15 |
+
python-docx>=0.8.11
|
| 16 |
+
pdfplumber>=0.10.0 # Optional
|
| 17 |
+
tika>=2.6.0 # Optional
|
| 18 |
+
|
| 19 |
+
# Utility Dependencies
|
| 20 |
+
python-dotenv>=1.0.0
|
| 21 |
+
numpy>=1.21.0
|
| 22 |
+
typing-extensions>=3.7.4
|
| 23 |
+
loguru>=0.7.0 # Optional
|
| 24 |
+
tqdm>=4.65.0 # Optional
|
| 25 |
+
|
| 26 |
+
# Development Dependencies (optional)
|
| 27 |
+
pytest>=7.0.0
|
| 28 |
+
black>=23.0.0
|
| 29 |
+
flake8>=6.0.0
|
| 30 |
+
pymupdf>=1.23.0 # For PDF text extraction (fitz)
|
| 31 |
+
python-docx>=0.8.11 # For DOCX text extraction
|
| 32 |
+
pdfplumber>=0.10.0 # Alternative PDF text extraction (optional)
|
| 33 |
+
tika>=2.6.0 # For extracting text from other file formats (optional)
|
| 34 |
+
|
| 35 |
+
# Utility Dependencies
|
| 36 |
+
python-dotenv>=1.0.0 # For environment variable management
|
| 37 |
+
numpy>=1.21.0 # For numerical operations (if needed)
|
| 38 |
+
typing-extensions>=3.7.4 # For type hints compatibility
|
| 39 |
+
loguru>=0.7.0 # For enhanced logging (optional, replace with logging if not needed)
|
| 40 |
+
tqdm>=4.65.0 # For progress bars (optional)
|
| 41 |
+
|
| 42 |
+
# Development Dependencies (optional)
|
| 43 |
+
pytest>=7.0.0 # For testing
|
| 44 |
+
black>=23.0.0 # For code formatting
|
| 45 |
+
flake8>=6.0.0 # For linting
|
| 46 |
+
pytesseract>=0.3.10 # For OCR (image text extraction)
|
| 47 |
pandas>=2.0.0 # For spreadsheet processing
|