open-navigator / requirements.txt
jcbowyer's picture
Clean HuggingFace deployment without binary files
61d29fc
# Core Dependencies
python-dotenv==1.0.0
pydantic==2.5.0
pydantic-settings==2.1.0
# Web Scraping & Data Collection
beautifulsoup4==4.12.2
selenium==4.16.0
playwright==1.40.0
httpx>=0.25.0
aiohttp==3.9.1
youtube-transcript-api>=0.6.2
# Document Processing (Multiple Formats)
PyPDF2>=3.0.0 # PDF extraction
pdfplumber>=0.10.0 # Advanced PDF extraction (tables)
python-pptx>=0.6.0 # PowerPoint extraction
python-docx>=1.0.0 # Word document extraction
openpyxl>=3.1.0 # Excel extraction
pytesseract>=0.3.0 # OCR for scanned documents (optional)
Pillow>=10.0.0 # Image processing for OCR
# AI & LLM
openai>=1.6.0
anthropic>=0.8.0
langchain>=0.1.0
langchain-openai>=0.0.2
langchain-community>=0.0.10
langgraph>=0.0.20
langchain-core>=0.1.0
tiktoken>=0.5.0
# Model Context Protocol (MCP) - Optional, for local MCP server only
# mcp>=0.1.0
# Data Processing & Lakehouse
databricks-sdk==0.18.0
delta-spark==3.0.0
pyspark==3.5.0
pandas==2.1.4
polars==0.20.2
pyarrow==14.0.2
duckdb>=0.9.0
# NLP & Text Analysis
spacy==3.7.2
transformers==4.36.2
sentence-transformers==2.2.2
nltk==3.8.1
datasets>=2.16.0
huggingface-hub>=0.20.0
# Database & Storage
sqlalchemy>=2.0.0
chromadb>=0.4.0
qdrant-client>=1.7.0
# API & Web Framework
fastapi==0.109.0
uvicorn[standard]==0.25.0
pydantic[email]==2.5.0
python-multipart==0.0.6
# Authentication & OAuth
python-jose[cryptography]==3.3.0 # JWT tokens
passlib[bcrypt]==1.7.4 # Password hashing
itsdangerous==2.1.2 # Secure tokens
psycopg2-binary==2.9.9 # PostgreSQL driver
asyncpg==0.29.0 # Async PostgreSQL driver (for Neon)
# Visualization
plotly==5.18.0
folium==0.15.1
matplotlib==3.8.2
seaborn==0.13.1
# Utilities
python-dateutil==2.8.2
pytz==2023.3
tenacity==8.2.3
loguru==0.7.2
click==8.1.7
tqdm==4.66.1
# Testing
pytest>=7.4.0
pytest-asyncio>=0.21.0
pytest-cov>=4.1.0
pytest-mock>=3.12.0
pytest-httpx>=0.27.0
# Development
black>=23.0.0
ruff>=0.1.0
mypy>=1.8.0
pre-commit>=3.6.0
# Optional: Google Data Commons Integration
# Recommended for jurisdiction enrichment (replaces manual Census API calls)
# Install with: pip install datacommons datacommons-pandas
# Documentation: https://docs.datacommons.org/api/
# datacommons>=1.4.0
# datacommons-pandas>=0.1.0