Digi-Biz / .env.example
Deployment Bot
Automated deployment to Hugging Face
255cbd1
# ===========================================
# Environment Configuration for Digi-Biz
# ===========================================
# Copy this file to .env and fill in your values
# ===========================================
# Groq API (for text AND vision LLM tasks)
# Get key from: https://console.groq.com
# ===========================================
# Placeholder only: put your real key in .env, never in this example file
GROQ_API_KEY=gsk_your_api_key_here
# Model for text tasks (schema mapping, classification)
# Groq model IDs include the publisher namespace (e.g. openai/..., meta-llama/...)
GROQ_MODEL=openai/gpt-oss-120b
# Model for vision tasks (image analysis)
GROQ_VISION_MODEL=meta-llama/llama-4-scout-17b-16e-instruct
# ===========================================
# Ollama Configuration (for Vision)
# ===========================================
# NOTE(review): GROQ_VISION_MODEL in the Groq section also names a vision
# model; presumably the application picks one of the two backends. Confirm
# which one is actually used before relying on these values.
# Base URL of the Ollama server (11434 is Ollama's default port, so the
# value below works unchanged for a local setup)
OLLAMA_HOST=http://localhost:11434
# Ollama model tag used for image analysis
# (presumably it must already be pulled on that host; TODO confirm)
OLLAMA_VISION_MODEL=qwen3.5:0.8b
# ===========================================
# Application Settings
# ===========================================
# Application environment: development or production
APP_ENV=development
# Log level: DEBUG, INFO, WARNING, ERROR or CRITICAL
LOG_LEVEL=INFO
# Maximum file size for ZIP uploads, in bytes
# Default: 524288000 = 500 * 1024 * 1024 (500 MiB)
MAX_FILE_SIZE=524288000
# Maximum number of files per ZIP
MAX_FILES_PER_ZIP=100
# ===========================================
# Storage Configuration
# ===========================================
# Base directory for all storage
# (relative path; presumably resolved against the directory the app is
# started from; TODO confirm)
STORAGE_BASE=./storage
# Subdirectory names, each relative to STORAGE_BASE
UPLOADS_DIR=uploads
EXTRACTED_DIR=extracted
PROFILES_DIR=profiles
INDEX_DIR=index
TEMP_DIR=temp
# ===========================================
# Processing Settings
# ===========================================
# Maximum number of document parsing tasks running concurrently
MAX_CONCURRENT_PARSING=5
# Maximum number of image analysis tasks running concurrently
MAX_CONCURRENT_VISION=3
# Timeout for document parsing, in seconds (300 s = 5 minutes)
PARSING_TIMEOUT=300
# Timeout for LLM requests, in seconds
LLM_TIMEOUT=60
# ===========================================
# Optional: OCR Settings (for scanned PDFs)
# ===========================================
# Enable OCR fallback for scanned PDFs
# (presumably accepts true/false; TODO confirm accepted spellings)
ENABLE_OCR_FALLBACK=true
# Path to the Tesseract executable (leave empty to use the default)
TESSERACT_PATH=
# ===========================================
# Optional: Rate Limiting
# ===========================================
# Maximum Groq API requests per minute
GROQ_RATE_LIMIT=30
# Maximum Ollama requests per minute
# (Ollama runs locally; the limit is here to manage concurrency)
OLLAMA_RATE_LIMIT=20