| # =========================================== | |
| # Environment Configuration for Digi-Biz | |
| # =========================================== | |
| # Copy this file to .env and fill in your values | |
| # =========================================== | |
| # Groq API (for text AND vision LLM tasks) | |
| # Get key from: https://console.groq.com | |
| # =========================================== | |
| GROQ_API_KEY=gsk_your_api_key_here | |
| # Model for text tasks (schema mapping, classification) | |
| # Groq model IDs include the provider prefix (e.g. openai/..., meta-llama/...) | |
| GROQ_MODEL=openai/gpt-oss-120b | |
| # Model for vision tasks (image analysis) | |
| # Current model: meta-llama/llama-4-scout-17b-16e-instruct | |
| GROQ_VISION_MODEL=meta-llama/llama-4-scout-17b-16e-instruct | |
| # =========================================== | |
| # Ollama Configuration (local vision model) | |
| # =========================================== | |
| # Local Ollama host (default is fine for local setup) | |
| OLLAMA_HOST=http://localhost:11434 | |
| # Vision model for image analysis | |
| OLLAMA_VISION_MODEL=qwen3.5:0.8b | |
| # =========================================== | |
| # Application Settings | |
| # =========================================== | |
| # Application environment (development, production) | |
| APP_ENV=development | |
| # Log level (DEBUG, INFO, WARNING, ERROR, CRITICAL) | |
| LOG_LEVEL=INFO | |
| # Maximum file size for ZIP uploads (in bytes) | |
| # Default: 500 MiB (500 * 1024 * 1024 = 524288000 bytes) | |
| MAX_FILE_SIZE=524288000 | |
| # Maximum files per ZIP | |
| MAX_FILES_PER_ZIP=100 | |
| # =========================================== | |
| # Storage Configuration | |
| # =========================================== | |
| # Base directory for all storage | |
| STORAGE_BASE=./storage | |
| # Subdirectories (relative to STORAGE_BASE) | |
| UPLOADS_DIR=uploads | |
| EXTRACTED_DIR=extracted | |
| PROFILES_DIR=profiles | |
| INDEX_DIR=index | |
| TEMP_DIR=temp | |
| # =========================================== | |
| # Processing Settings | |
| # =========================================== | |
| # Number of concurrent document parsing tasks | |
| MAX_CONCURRENT_PARSING=5 | |
| # Number of concurrent image analysis tasks | |
| MAX_CONCURRENT_VISION=3 | |
| # Timeout for document parsing (seconds) | |
| PARSING_TIMEOUT=300 | |
| # Timeout for LLM requests (seconds) | |
| LLM_TIMEOUT=60 | |
| # =========================================== | |
| # Optional: OCR Settings (for scanned PDFs) | |
| # =========================================== | |
| # Enable OCR fallback for scanned PDFs | |
| ENABLE_OCR_FALLBACK=true | |
| # Tesseract executable path (leave empty for default) | |
| TESSERACT_PATH= | |
| # =========================================== | |
| # Optional: Rate Limiting | |
| # =========================================== | |
| # Groq API requests per minute | |
| GROQ_RATE_LIMIT=30 | |
| # Ollama requests per minute (Ollama runs locally; this limit is used to manage concurrency) | |
| OLLAMA_RATE_LIMIT=20 | |